flat
nested
lists
sparse
complex
books
countries
large_mixed
large_num
large_text
mcp_tools
simple_flat.json — Original: 763 chars — Tokenizer: gpt2 (openai-community/gpt2)
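| Format | Chars | Tokens | chars_og/tok | enc_chars/tok |
|---|---|---|---|---|
| JSON (pretty) | 763 | 384 | 2.0 | 2.0 |
| JSON (min) | 522 | 152 | 5.0 | 3.4 |
| CSV | 234 | 95 | 8.0 | 2.5 |
| TSV | 234 | 95 | 8.0 | 2.5 |
| YAML | 489 | 163 | 4.7 | 3.0 |
| TOON | 246 | 98 | 7.8 | 2.5 |
| TSON | 229 | 90 | 8.5 | 2.5 |
| minemizer | 251 | 74 | 10.3 | 3.4 |
| minemizer (compact) | 224 | 85 | 9.0 | 2.6 |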
JSON (pretty)
chars: 763 tokens: 384 chars_og/tok: 2.0 enc_chars/tok: 2.0
[
· {
··· "id": 1,
··· "name": "Alice",
··· "role": "Engineer",
··· "department": "Backend"
· },
· {
··· "id": 2,
··· "name": "Bob",
··· "role": "Designer",
··· "department": "Frontend"
· },
· {
··· "id": 3,
··· "name": "Carol",
··· "role": "Manager",
··· "department": "Product"
· },
· {
··· "id": 4,
··· "name": "David",
··· "role": "Engineer",
··· "department": "Infrastructure"
· },
... (truncated)
JSON (min)
chars: 522 tokens: 152 chars_og/tok: 5.0 enc_chars/tok: 3.4
[{"id":1,"name":"Alice","role":"Engineer","department":"Backend"},{"id":2,"name":"Bob","role":"Designer","department":"Frontend"},{"id":3,"name":"Carol","role":"Manager","department":"Product"},{"id":4,"name":"David","role":"Engineer","department":"Infrastructure"},{"id":5,"name":"Eva","role":"Analyst","department":"Data"},{"id":6,"name":"Frank","role":"Engineer","department":"Backend"},{"id":7,"name":"Grace","role":"Designer","department":"Mobile"},{"id":8,"name":"Henry","role":"Manager","department":"Engineering"}]
CSV
chars: 234 tokens: 95 chars_og/tok: 8.0 enc_chars/tok: 2.5
id,name,role,department
1,Alice,Engineer,Backend
2,Bob,Designer,Frontend
3,Carol,Manager,Product
4,David,Engineer,Infrastructure
5,Eva,Analyst,Data
6,Frank,Engineer,Backend
7,Grace,Designer,Mobile
8,Henry,Manager,Engineering
TSV
chars: 234 tokens: 95 chars_og/tok: 8.0 enc_chars/tok: 2.5
id	name	role	department
1	Alice	Engineer	Backend
2	Bob	Designer	Frontend
3	Carol	Manager	Product
4	David	Engineer	Infrastructure
5	Eva	Analyst	Data
6	Frank	Engineer	Backend
7	Grace	Designer	Mobile
8	Henry	Manager	Engineering
YAML
chars: 489 tokens: 163 chars_og/tok: 4.7 enc_chars/tok: 3.0
- department: Backend
· id: 1
· name: Alice
· role: Engineer
- department: Frontend
· id: 2
· name: Bob
· role: Designer
- department: Product
· id: 3
· name: Carol
· role: Manager
- department: Infrastructure
· id: 4
· name: David
· role: Engineer
- department: Data
· id: 5
· name: Eva
· role: Analyst
- department: Backend
· id: 6
· name: Frank
· role: Engineer
- department: Mobile
... (truncated)
TOON
chars: 246 tokens: 98 chars_og/tok: 7.8 enc_chars/tok: 2.5
[8]{id,name,role,department}:
· 1,Alice,Engineer,Backend
· 2,Bob,Designer,Frontend
· 3,Carol,Manager,Product
· 4,David,Engineer,Infrastructure
· 5,Eva,Analyst,Data
· 6,Frank,Engineer,Backend
· 7,Grace,Designer,Mobile
· 8,Henry,Manager,Engineering
TSON
chars: 229 tokens: 90 chars_og/tok: 8.5 enc_chars/tok: 2.5
{@id,name,role,department#8|1,Alice,Engineer,Backend|2,Bob,Designer,Frontend|3,Carol,Manager,Product|4,David,Engineer,Infrastructure|5,Eva,Analyst,Data|6,Frank,Engineer,Backend|7,Grace,Designer,Mobile|8,Henry,Manager,Engineering}
minemizer
chars: 251 tokens: 74 chars_og/tok: 10.3 enc_chars/tok: 3.4
id; name; role; department
1; Alice; Engineer; Backend
2; Bob; Designer; Frontend
3; Carol; Manager; Product
4; David; Engineer; Infrastructure
5; Eva; Analyst; Data
6; Frank; Engineer; Backend
7; Grace; Designer; Mobile
8; Henry; Manager; Engineering
minemizer (compact)
chars: 224 tokens: 85 chars_og/tok: 9.0 enc_chars/tok: 2.6
id;name;role;department
1;Alice;Engineer;Backend
2;Bob;Designer;Frontend
3;Carol;Manager;Product
4;David;Engineer;Infrastructure
5;Eva;Analyst;Data
6;Frank;Engineer;Backend
7;Grace;Designer;Mobile
8;Henry;Manager;Engineering
nested_objects.json — Original: 1039 chars — Tokenizer: gpt2 (openai-community/gpt2)
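| Format | Chars | Tokens | chars_og/tok | enc_chars/tok |
|---|---|---|---|---|
| JSON (pretty) | 1,039 | 590 | 1.8 | 1.8 |
| JSON (min) | 618 | 188 | 5.5 | 3.3 |
| CSV | N/A | | | |
| TSV | N/A | | | |
| YAML | 629 | 264 | 3.9 | 2.4 |
| TOON | 675 | 315 | 3.3 | 2.1 |
| TSON | 306 | 136 | 7.6 | 2.2 |
| minemizer | 325 | 126 | 8.2 | 2.6 |
| minemizer (compact) | 290 | 132 | 7.9 | 2.2 |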
JSON (pretty)
chars: 1,039 tokens: 590 chars_og/tok: 1.8 enc_chars/tok: 1.8
[
· {
··· "id": "u1",
··· "name": "Lukas",
··· "location": {
····· "office": "Kaunas HQ",
····· "floor": 12
··· },
··· "skills": [
····· "python",
····· "kubernetes"
··· ]
· },
· {
··· "id": "u2",
··· "name": "Emma",
··· "location": {
····· "office": "Boston Hub",
····· "floor": 7
··· },
··· "skills": [
····· "react",
····· "typescript",
····· "graphql"
··· ]
... (truncated)
JSON (min)
chars: 618 tokens: 188 chars_og/tok: 5.5 enc_chars/tok: 3.3
[{"id":"u1","name":"Lukas","location":{"office":"Kaunas HQ","floor":12},"skills":["python","kubernetes"]},{"id":"u2","name":"Emma","location":{"office":"Boston Hub","floor":7},"skills":["react","typescript","graphql"]},{"id":"u3","name":"Pierre","location":{"office":"Paris Office","floor":3},"skills":["rust"]},{"id":"u4","name":"Hana","location":{"office":"Tokyo Tower","floor":15},"skills":["go","docker"]},{"id":"u5","name":"Wei","location":{"office":"Taipei Center","floor":8},"skills":["java","spring"]},{"id":"u6","name":"Charlotte","location":{"office":"London Bridge","floor":5},"skills":["python","django"]}]
CSV: N/A
TSV: N/A
YAML
chars: 629 tokens: 264 chars_og/tok: 3.9 enc_chars/tok: 2.4
- id: u1
· location:
··· floor: 12
··· office: Kaunas HQ
· name: Lukas
· skills:
· - python
· - kubernetes
- id: u2
· location:
··· floor: 7
··· office: Boston Hub
· name: Emma
· skills:
· - react
· - typescript
· - graphql
- id: u3
· location:
··· floor: 3
··· office: Paris Office
· name: Pierre
· skills:
· - rust
- id: u4
... (truncated)
TOON
chars: 675 tokens: 315 chars_og/tok: 3.3 enc_chars/tok: 2.1
[6]:
· - id: u1
··· name: Lukas
··· location:
····· office: Kaunas HQ
····· floor: 12
··· skills[2]: python,kubernetes
· - id: u2
··· name: Emma
··· location:
····· office: Boston Hub
····· floor: 7
··· skills[3]: react,typescript,graphql
· - id: u3
··· name: Pierre
··· location:
····· office: Paris Office
····· floor: 3
··· skills[1]: rust
· - id: u4
··· name: Hana
··· location:
····· office: Tokyo Tower
····· floor: 15
··· skills[2]: go,docker
... (truncated)
TSON
chars: 306 tokens: 136 chars_og/tok: 7.6 enc_chars/tok: 2.2
{@id,name,location(@office,floor),skills#6|u1,Lukas,{"Kaunas HQ",12},[python,kubernetes]|u2,Emma,{"Boston Hub",7},[react,typescript,graphql]|u3,Pierre,{"Paris Office",3},[rust]|u4,Hana,{"Tokyo Tower",15},[go,docker]|u5,Wei,{"Taipei Center",8},[java,spring]|u6,Charlotte,{"London Bridge",5},[python,django]}
minemizer
chars: 325 tokens: 126 chars_og/tok: 8.2 enc_chars/tok: 2.6
id; name; location{ office; floor}; skills[]
u1; Lukas;{ Kaunas HQ; 12};[ python; kubernetes]
u2; Emma;{ Boston Hub; 7};[ react; typescript; graphql]
u3; Pierre;{ Paris Office; 3};[ rust]
u4; Hana;{ Tokyo Tower; 15};[ go; docker]
u5; Wei;{ Taipei Center; 8};[ java; spring]
u6; Charlotte;{ London Bridge; 5};[ python; django]
minemizer (compact)
chars: 290 tokens: 132 chars_og/tok: 7.9 enc_chars/tok: 2.2
id;name;location{office;floor};skills[]
u1;Lukas;{Kaunas HQ;12};[python;kubernetes]
u2;Emma;{Boston Hub;7};[react;typescript;graphql]
u3;Pierre;{Paris Office;3};[rust]
u4;Hana;{Tokyo Tower;15};[go;docker]
u5;Wei;{Taipei Center;8};[java;spring]
u6;Charlotte;{London Bridge;5};[python;django]
lists_of_primitives.json — Original: 610 chars — Tokenizer: gpt2 (openai-community/gpt2)
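| Format | Chars | Tokens | chars_og/tok | enc_chars/tok |
|---|---|---|---|---|
| JSON (pretty) | 610 | 382 | 1.6 | 1.6 |
| JSON (min) | 330 | 115 | 5.3 | 2.9 |
| CSV | N/A | | | |
| TSV | N/A | | | |
| YAML | 341 | 153 | 4.0 | 2.2 |
| TOON | 339 | 161 | 3.8 | 2.1 |
| TSON | 168 | 80 | 7.6 | 2.1 |
| minemizer | 188 | 81 | 7.5 | 2.3 |
| minemizer (compact) | 165 | 83 | 7.3 | 2.0 |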
JSON (pretty)
chars: 610 tokens: 382 chars_og/tok: 1.6 enc_chars/tok: 1.6
[
· {
··· "id": 1,
··· "name": "Alice",
··· "skills": [
····· "python",
····· "go",
····· "rust"
··· ]
· },
· {
··· "id": 2,
··· "name": "Bob",
··· "skills": [
····· "javascript",
····· "typescript"
··· ]
· },
· {
··· "id": 3,
··· "name": "Carol",
··· "skills": [
····· "java",
····· "kotlin",
····· "scala",
... (truncated)
JSON (min)
chars: 330 tokens: 115 chars_og/tok: 5.3 enc_chars/tok: 2.9
[{"id":1,"name":"Alice","skills":["python","go","rust"]},{"id":2,"name":"Bob","skills":["javascript","typescript"]},{"id":3,"name":"Carol","skills":["java","kotlin","scala","groovy"]},{"id":4,"name":"David","skills":["c","cpp"]},{"id":5,"name":"Eva","skills":["ruby","elixir","erlang"]},{"id":6,"name":"Frank","skills":["swift"]}]
CSV: N/A
TSV: N/A
YAML
chars: 341 tokens: 153 chars_og/tok: 4.0 enc_chars/tok: 2.2
- id: 1
· name: Alice
· skills:
· - python
· - go
· - rust
- id: 2
· name: Bob
· skills:
· - javascript
· - typescript
- id: 3
· name: Carol
· skills:
· - java
· - kotlin
· - scala
· - groovy
- id: 4
· name: David
· skills:
· - c
· - cpp
- id: 5
· name: Eva
... (truncated)
TOON
chars: 339 tokens: 161 chars_og/tok: 3.8 enc_chars/tok: 2.1
[6]:
· - id: 1
··· name: Alice
··· skills[3]: python,go,rust
· - id: 2
··· name: Bob
··· skills[2]: javascript,typescript
· - id: 3
··· name: Carol
··· skills[4]: java,kotlin,scala,groovy
· - id: 4
··· name: David
··· skills[2]: c,cpp
· - id: 5
··· name: Eva
··· skills[3]: ruby,elixir,erlang
· - id: 6
··· name: Frank
··· skills[1]: swift
TSON
chars: 168 tokens: 80 chars_og/tok: 7.6 enc_chars/tok: 2.1
{@id,name,skills#6|1,Alice,[python,go,rust]|2,Bob,[javascript,typescript]|3,Carol,[java,kotlin,scala,groovy]|4,David,[c,cpp]|5,Eva,[ruby,elixir,erlang]|6,Frank,[swift]}
minemizer
chars: 188 tokens: 81 chars_og/tok: 7.5 enc_chars/tok: 2.3
id; name; skills[]
1; Alice;[ python; go; rust]
2; Bob;[ javascript; typescript]
3; Carol;[ java; kotlin; scala; groovy]
4; David;[ c; cpp]
5; Eva;[ ruby; elixir; erlang]
6; Frank;[ swift]
minemizer (compact)
chars: 165 tokens: 83 chars_og/tok: 7.3 enc_chars/tok: 2.0
id;name;skills[]
1;Alice;[python;go;rust]
2;Bob;[javascript;typescript]
3;Carol;[java;kotlin;scala;groovy]
4;David;[c;cpp]
5;Eva;[ruby;elixir;erlang]
6;Frank;[swift]
sparse_data.json — Original: 611 chars — Tokenizer: gpt2 (openai-community/gpt2)
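| Format | Chars | Tokens | chars_og/tok | enc_chars/tok |
|---|---|---|---|---|
| JSON (pretty) | 611 | 323 | 1.9 | 1.9 |
| JSON (min) | 400 | 131 | 4.7 | 3.1 |
| CSV | N/A | | | |
| TSV | N/A | | | |
| YAML | 384 | 145 | 4.2 | 2.6 |
| TOON | 438 | 190 | 3.2 | 2.3 |
| TSON | 328 | 146 | 4.2 | 2.2 |
| minemizer | 200 | 72 | 8.5 | 2.8 |
| minemizer (compact) | 180 | 82 | 7.5 | 2.2 |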
JSON (pretty)
chars: 611 tokens: 323 chars_og/tok: 1.9 enc_chars/tok: 1.9
[
· {
··· "id": 1,
··· "name": "Erik",
··· "department": "Engineering"
· },
· {
··· "id": 2,
··· "name": "Rachel",
··· "department": "Design",
··· "remote": true
· },
· {
··· "id": 3,
··· "name": "Hans"
· },
· {
··· "id": 4,
··· "name": "Kenji",
··· "department": "Sales",
··· "slack": "@kenji",
··· "remote": false
· },
· {
··· "id": 5,
... (truncated)
JSON (min)
chars: 400 tokens: 131 chars_og/tok: 4.7 enc_chars/tok: 3.1
[{"id":1,"name":"Erik","department":"Engineering"},{"id":2,"name":"Rachel","department":"Design","remote":true},{"id":3,"name":"Hans"},{"id":4,"name":"Kenji","department":"Sales","slack":"@kenji","remote":false},{"id":5,"name":"Mai","remote":true},{"id":6,"name":"Tom","department":"Engineering"},{"id":7,"name":"Priya","slack":"@priya","remote":true},{"id":8,"name":"Nina","department":"Marketing"}]
CSV: N/A
TSV: N/A
YAML
chars: 384 tokens: 145 chars_og/tok: 4.2 enc_chars/tok: 2.6
- department: Engineering
· id: 1
· name: Erik
- department: Design
· id: 2
· name: Rachel
· remote: true
- id: 3
· name: Hans
- department: Sales
· id: 4
· name: Kenji
· remote: false
· slack: '@kenji'
- id: 5
· name: Mai
· remote: true
- department: Engineering
· id: 6
· name: Tom
- id: 7
· name: Priya
· remote: true
· slack: '@priya'
- department: Marketing
... (truncated)
TOON
chars: 438 tokens: 190 chars_og/tok: 3.2 enc_chars/tok: 2.3
[8]:
· - id: 1
··· name: Erik
··· department: Engineering
· - id: 2
··· name: Rachel
··· department: Design
··· remote: true
· - id: 3
··· name: Hans
· - id: 4
··· name: Kenji
··· department: Sales
··· slack: @kenji
··· remote: false
· - id: 5
··· name: Mai
··· remote: true
· - id: 6
··· name: Tom
··· department: Engineering
· - id: 7
··· name: Priya
··· slack: @priya
··· remote: true
... (truncated)
TSON
chars: 328 tokens: 146 chars_og/tok: 4.2 enc_chars/tok: 2.2
[{@id,name,department|1,Erik,Engineering},{@id,name,department,remote|2,Rachel,Design,true},{@id,name|3,Hans},{@id,name,department,slack,remote|4,Kenji,Sales,"@kenji",false},{@id,name,remote|5,Mai,true},{@id,name,department|6,Tom,Engineering},{@id,name,slack,remote|7,Priya,"@priya",true},{@id,name,department|8,Nina,Marketing}]
minemizer
chars: 200 tokens: 72 chars_og/tok: 8.5 enc_chars/tok: 2.8
id; name; department; remote
1; Erik; Engineering
2; Rachel; Design;true
3; Hans
4; Kenji; Sales;false; slack: @kenji
5; Mai;;true
6; Tom; Engineering
7; Priya;;true; slack: @priya
8; Nina; Marketing;
minemizer (compact)
chars: 180 tokens: 82 chars_og/tok: 7.5 enc_chars/tok: 2.2
id;name;department;remote
1;Erik;Engineering
2;Rachel;Design;true
3;Hans
4;Kenji;Sales;false;slack:@kenji
5;Mai;;true
6;Tom;Engineering
7;Priya;;true;slack:@priya
8;Nina;Marketing;
complex_mixed.json — Original: 1320 chars — Tokenizer: gpt2 (openai-community/gpt2)
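| Format | Chars | Tokens | chars_og/tok | enc_chars/tok |
|---|---|---|---|---|
| JSON (pretty) | 1,320 | 768 | 1.7 | 1.7 |
| JSON (min) | 760 | 224 | 5.9 | 3.4 |
| CSV | N/A | | | |
| TSV | N/A | | | |
| YAML | 818 | 374 | 3.5 | 2.2 |
| TOON | 881 | 434 | 3.0 | 2.0 |
| TSON | 453 | 207 | 6.4 | 2.2 |
| minemizer | 403 | 157 | 8.4 | 2.6 |
| minemizer (compact) | 361 | 173 | 7.6 | 2.1 |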
JSON (pretty)
chars: 1,320 tokens: 768 chars_og/tok: 1.7 enc_chars/tok: 1.7
[
· {
··· "id": 1,
··· "profile": {
····· "name": "Grace",
····· "location": {
······· "city": "NYC",
······· "country": "USA"
····· }
··· },
··· "tags": [
····· "admin",
····· "verified"
··· ],
··· "metadata": {
····· "created": "2024-01-15"
··· }
· },
· {
··· "id": 2,
··· "profile": {
····· "name": "Henry",
····· "location": {
······· "city": "London",
······· "country": "UK"
... (truncated)
JSON (min)
chars: 760 tokens: 224 chars_og/tok: 5.9 enc_chars/tok: 3.4
[{"id":1,"profile":{"name":"Grace","location":{"city":"NYC","country":"USA"}},"tags":["admin","verified"],"metadata":{"created":"2024-01-15"}},{"id":2,"profile":{"name":"Henry","location":{"city":"London","country":"UK"}},"tags":["user"],"metadata":{"created":"2024-02-20","updated":"2024-03-10"}},{"id":3,"profile":{"name":"Ivy","location":{"city":"Tokyo","country":"Japan"}},"tags":["moderator","verified","premium"],"metadata":{"created":"2024-01-05"}},{"id":4,"profile":{"name":"Jack","location":{"city":"Sydney","country":"Australia"}},"tags":["user","new"],"metadata":{"created":"2024-04-01"}},{"id":5,"profile":{"name":"Kate","location":{"city":"Berlin","country":"Germany"}},"tags":["admin"],"metadata":{"created":"2023-12-01","updated":"2024-02-15"}}]
CSV: N/A
TSV: N/A
YAML
chars: 818 tokens: 374 chars_og/tok: 3.5 enc_chars/tok: 2.2
- id: 1
· metadata:
··· created: '2024-01-15'
· profile:
··· location:
····· city: NYC
····· country: USA
··· name: Grace
· tags:
· - admin
· - verified
- id: 2
· metadata:
··· created: '2024-02-20'
··· updated: '2024-03-10'
· profile:
··· location:
····· city: London
····· country: UK
··· name: Henry
· tags:
· - user
- id: 3
· metadata:
··· created: '2024-01-05'
... (truncated)
TOON
chars: 881 tokens: 434 chars_og/tok: 3.0 enc_chars/tok: 2.0
[5]:
· - id: 1
··· profile:
····· name: Grace
····· location:
······· city: NYC
······· country: USA
··· tags[2]: admin,verified
··· metadata:
····· created: 2024-01-15
· - id: 2
··· profile:
····· name: Henry
····· location:
······· city: London
······· country: UK
··· tags[1]: user
··· metadata:
····· created: 2024-02-20
····· updated: 2024-03-10
· - id: 3
··· profile:
····· name: Ivy
····· location:
······· city: Tokyo
... (truncated)
TSON
chars: 453 tokens: 207 chars_og/tok: 6.4 enc_chars/tok: 2.2
{@id,profile(@name,location),tags,metadata#5|1,{Grace,{@city,country|NYC,USA}},[admin,verified],{@created|2024-01-15}|2,{Henry,{@city,country|London,UK}},[user],{@created,updated|2024-02-20,2024-03-10}|3,{Ivy,{@city,country|Tokyo,Japan}},[moderator,verified,premium],{@created|2024-01-05}|4,{Jack,{@city,country|Sydney,Australia}},[user,new],{@created|2024-04-01}|5,{Kate,{@city,country|Berlin,Germany}},[admin],{@created,updated|2023-12-01,2024-02-15}}
minemizer
chars: 403 tokens: 157 chars_og/tok: 8.4 enc_chars/tok: 2.6
id; profile{ name; location{ city; country}}; tags[]; metadata{ created; ...}
1;{ Grace;{ NYC; USA}};[ admin; verified];{ 2024-01-15}
2;{ Henry;{ London; UK}};[ user];{ 2024-02-20; updated: 2024-03-10}
3;{ Ivy;{ Tokyo; Japan}};[ moderator; verified; premium];{ 2024-01-05}
4;{ Jack;{ Sydney; Australia}};[ user; new];{ 2024-04-01}
5;{ Kate;{ Berlin; Germany}};[ admin];{ 2023-12-01; updated: 2024-02-15}
minemizer (compact)
chars: 361 tokens: 173 chars_og/tok: 7.6 enc_chars/tok: 2.1
id;profile{name;location{city;country}};tags[];metadata{created;...}
1;{Grace;{NYC;USA}};[admin;verified];{2024-01-15}
2;{Henry;{London;UK}};[user];{2024-02-20;updated:2024-03-10}
3;{Ivy;{Tokyo;Japan}};[moderator;verified;premium];{2024-01-05}
4;{Jack;{Sydney;Australia}};[user;new];{2024-04-01}
5;{Kate;{Berlin;Germany}};[admin];{2023-12-01;updated:2024-02-15}
books.json — Original: 27902 chars — Tokenizer: gpt2 (openai-community/gpt2)
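| Format | Chars | Tokens | chars_og/tok | enc_chars/tok |
|---|---|---|---|---|
| JSON (pretty) | 27,902 | 12,188 | 2.3 | 2.3 |
| JSON (min) | 22,501 | 7,103 | 3.9 | 3.2 |
| CSV | 14,071 | 5,354 | 5.2 | 2.6 |
| TSV | 14,057 | 5,564 | 5.0 | 2.5 |
| YAML | 22,400 | 8,081 | 3.5 | 2.8 |
| TOON | 14,277 | 5,388 | 5.2 | 2.6 |
| TSON | 14,448 | 5,433 | 5.1 | 2.7 |
| minemizer | 14,458 | 5,152 | 5.4 | 2.8 |
| minemizer (compact) | 13,753 | 5,260 | 5.3 | 2.6 |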
JSON (pretty)
chars: 27,902 tokens: 12,188 chars_og/tok: 2.3 enc_chars/tok: 2.3
[
· {
··· "author": "Chinua Achebe",
··· "country": "Nigeria",
··· "imageLink": "images/things-fall-apart.jpg",
··· "language": "English",
··· "link": "https://en.wikipedia.org/wiki/Things_Fall_Apart\n",
··· "pages": 209,
··· "title": "Things Fall Apart",
··· "year": 1958
· },
· {
··· "author": "Hans Christian Andersen",
··· "country": "Denmark",
··· "imageLink": "images/fairy-tales.jpg",
··· "language": "Danish",
··· "link": "https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",
··· "pages": 784,
··· "title": "Fairy tales",
··· "year": 1836
· },
· {
··· "author": "Dante Alighieri",
··· "country": "Italy",
··· "imageLink": "images/the-divine-comedy.jpg",
... (truncated)
JSON (min)
chars: 22,501 tokens: 7,103 chars_og/tok: 3.9 enc_chars/tok: 3.2
[{"author":"Chinua Achebe","country":"Nigeria","imageLink":"images/things-fall-apart.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Things_Fall_Apart\n","pages":209,"title":"Things Fall Apart","year":1958},{"author":"Hans Christian Andersen","country":"Denmark","imageLink":"images/fairy-tales.jpg","language":"Danish","link":"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n","pages":784,"title":"Fairy tales","year":1836},{"author":"Dante Alighieri","country":"Italy","imageLink":"images/the-divine-comedy.jpg","language":"Italian","link":"https://en.wikipedia.org/wiki/Divine_Comedy\n","pages":928,"title":"The Divine Comedy","year":1315},{"author":"Unknown","country":"Sumer and Akkadian Empire","imageLink":"images/the-epic-of-gilgamesh.jpg","language":"Akkadian","link":"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n","pages":160,"title":"The Epic Of Gilgamesh","year":-1700},{"author":"Unknown","country":"Achaemenid Empire","imageLink":"images/the-book-of-job.jpg","language":"Hebrew","link":"https://en.wikipedia.org/wiki/Book_of_Job\n","pages":176,"title":"The Book Of Job","year":-600},{"author":"Unknown","country":"India/Iran/Iraq/Egypt/Tajikistan","imageLink":"images/one-thousand-and-one-nights.jpg","language":"Arabic","link":"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n","pages":288,"title":"One Thousand and One Nights","year":1200},{"author":"Unknown","country":"Iceland","imageLink":"images/njals-saga.jpg","language":"Old Norse","link":"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n","pages":384,"title":"Nj\u00e1l's Saga","year":1350},{"author":"Jane Austen","country":"United Kingdom","imageLink":"images/pride-and-prejudice.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n","pages":226,"title":"Pride and Prejudice","year":1813},{"author":"Honor\u00e9 de 
Balzac","country":"France","imageLink":"images/le-pere-goriot.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n","pages":443,"title":"Le P\u00e8re Goriot","year":1835},{"author":"Samuel Beckett","country":"Republic of Ireland","imageLink":"images/molloy-malone-dies-the-unnamable.jpg","language":"French, English","link":"https://en.wikipedia.org/wiki/Molloy_(novel)\n","pages":256,"title":"Molloy, Malone Dies, The Unnamable, the trilogy","year":1952},{"author":"Giovanni Boccaccio","country":"Italy","imageLink":"images/the-decameron.jpg","language":"Italian","link":"https://en.wikipedia.org/wiki/The_Decameron\n","pages":1024,"title":"The Decameron","year":1351},{"author":"Jorge Luis Borges","country":"Argentina","imageLink":"images/ficciones.jpg","language":"Spanish","link":"https://en.wikipedia.org/wiki/Ficciones\n","pages":224,"title":"Ficciones","year":1965},{"author":"Emily Bront\u00eb","country":"United Kingdom","imageLink":"images/wuthering-heights.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Wuthering_Heights\n","pages":342,"title":"Wuthering Heights","year":1847},{"author":"Albert Camus","country":"Algeria, French Empire","imageLink":"images/l-etranger.jpg","language":"French","link":"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n","pages":185,"title":"The Stranger","year":1942},{"author":"Paul Celan","country":"Romania, France","imageLink":"images/poems-paul-celan.jpg","language":"German","link":"\n","pages":320,"title":"Poems","year":1952},{"author":"Louis-Ferdinand C\u00e9line","country":"France","imageLink":"images/voyage-au-bout-de-la-nuit.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n","pages":505,"title":"Journey to the End of the Night","year":1932},{"author":"Miguel de 
Cervantes","country":"Spain","imageLink":"images/don-quijote-de-la-mancha.jpg","language":"Spanish","link":"https://en.wikipedia.org/wiki/Don_Quixote\n","pages":1056,"title":"Don Quijote De La Mancha","year":1610},{"author":"Geoffrey Chaucer","country":"England","imageLink":"images/the-canterbury-tales.jpg","language":"English","link":"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n","pages":544,"title":"The Canterbury Tales","year":1450},{"author":"Anton Chekhov","country":"Russia","imageLink":"images/stories-of-anton-chekhov.jpg","language":"Russian","link":"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n","pages":194,"title":"Stories","year":1886},{"author":"Joseph Conrad","country":"United Kingdom","imageLink":"images/nostromo.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Nostromo\n","pages":320,"title":"Nostromo","year":1904},{"author":"Charles Dickens","country":"United Kingdom","imageLink":"images/great-expectations.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Great_Expectations\n","pages":194,"title":"Great Expectations","year":1861},{"author":"Denis Diderot","country":"France","imageLink":"images/jacques-the-fatalist.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Jacques_the_Fatalis
... (truncated)
CSV
chars: 14,071 tokens: 5,354 chars_og/tok: 5.2 enc_chars/tok: 2.6
author,country,imageLink,language,link,pages,title,year
Chinua Achebe,Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart
",209,Things Fall Apart,1958
Hans Christian Andersen,Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.
",784,Fairy tales,1836
Dante Alighieri,Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy
",928,The Divine Comedy,1315
Unknown,Sumer and Akkadian Empire,images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
",160,The Epic Of Gilgamesh,-1700
Unknown,Achaemenid Empire,images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job
",176,The Book Of Job,-600
Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
",288,One Thousand and One Nights,1200
Unknown,Iceland,images/njals-saga.jpg,Old Norse,"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
",384,Njál's Saga,1350
Jane Austen,United Kingdom,images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice
",226,Pride and Prejudice,1813
Honoré de Balzac,France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
",443,Le Père Goriot,1835
Samuel Beckett,Republic of Ireland,images/molloy-malone-dies-the-unnamable.jpg,"French, English","https://en.wikipedia.org/wiki/Molloy_(novel)
",256,"Molloy, Malone Dies, The Unnamable, the trilogy",1952
Giovanni Boccaccio,Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron
",1024,The Decameron,1351
Jorge Luis Borges,Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones
",224,Ficciones,1965
... (truncated)
TSV
chars: 14,057 tokens: 5,564 chars_og/tok: 5.0 enc_chars/tok: 2.5
author	country	imageLink	language	link	pages	title	year
Chinua Achebe	Nigeria	images/things-fall-apart.jpg	English	"https://en.wikipedia.org/wiki/Things_Fall_Apart
"	209	Things Fall Apart	1958
Hans Christian Andersen	Denmark	images/fairy-tales.jpg	Danish	"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.
"	784	Fairy tales	1836
Dante Alighieri	Italy	images/the-divine-comedy.jpg	Italian	"https://en.wikipedia.org/wiki/Divine_Comedy
"	928	The Divine Comedy	1315
Unknown	Sumer and Akkadian Empire	images/the-epic-of-gilgamesh.jpg	Akkadian	"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
"	160	The Epic Of Gilgamesh	-1700
Unknown	Achaemenid Empire	images/the-book-of-job.jpg	Hebrew	"https://en.wikipedia.org/wiki/Book_of_Job
"	176	The Book Of Job	-600
Unknown	India/Iran/Iraq/Egypt/Tajikistan	images/one-thousand-and-one-nights.jpg	Arabic	"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
"	288	One Thousand and One Nights	1200
Unknown	Iceland	images/njals-saga.jpg	Old Norse	"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
"	384	Njál's Saga	1350
Jane Austen	United Kingdom	images/pride-and-prejudice.jpg	English	"https://en.wikipedia.org/wiki/Pride_and_Prejudice
"	226	Pride and Prejudice	1813
Honoré de Balzac	France	images/le-pere-goriot.jpg	French	"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
"	443	Le Père Goriot	1835
Samuel Beckett	Republic of Ireland	images/molloy-malone-dies-the-unnamable.jpg	French, English	"https://en.wikipedia.org/wiki/Molloy_(novel)
"	256	Molloy, Malone Dies, The Unnamable, the trilogy	1952
Giovanni Boccaccio	Italy	images/the-decameron.jpg	Italian	"https://en.wikipedia.org/wiki/The_Decameron
"	1024	The Decameron	1351
Jorge Luis Borges	Argentina	images/ficciones.jpg	Spanish	"https://en.wikipedia.org/wiki/Ficciones
"	224	Ficciones	1965
... (truncated)
YAML
chars: 22,400 tokens: 8,081 chars_og/tok: 3.5 enc_chars/tok: 2.8
- author: Chinua Achebe
· country: Nigeria
· imageLink: images/things-fall-apart.jpg
· language: English
· link: 'https://en.wikipedia.org/wiki/Things_Fall_Apart↵↵
··· '
· pages: 209
· title: Things Fall Apart
· year: 1958
- author: Hans Christian Andersen
· country: Denmark
· imageLink: images/fairy-tales.jpg
· language: Danish
· link: 'https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵↵
··· '
· pages: 784
· title: Fairy tales
· year: 1836
- author: Dante Alighieri
· country: Italy
· imageLink: images/the-divine-comedy.jpg
· language: Italian
· link: 'https://en.wikipedia.org/wiki/Divine_Comedy
... (truncated)
TOON
chars: 14,277 tokens: 5,388 chars_og/tok: 5.2 enc_chars/tok: 2.6
[100]{author,country,imageLink,language,link,pages,title,year}:
· Chinua Achebe,Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart\n",209,Things Fall Apart,1958
· Hans Christian Andersen,Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",784,Fairy tales,1836
· Dante Alighieri,Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy\n",928,The Divine Comedy,1315
· Unknown,Sumer and Akkadian Empire,images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n",160,The Epic Of Gilgamesh,-1700
· Unknown,Achaemenid Empire,images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job\n",176,The Book Of Job,-600
· Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n",288,One Thousand and One Nights,1200
· Unknown,Iceland,images/njals-saga.jpg,Old Norse,"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n",384,Njál's Saga,1350
· Jane Austen,United Kingdom,images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n",226,Pride and Prejudice,1813
· Honoré de Balzac,France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n",443,Le Père Goriot,1835
· Samuel Beckett,Republic of Ireland,images/molloy-malone-dies-the-unnamable.jpg,"French, English","https://en.wikipedia.org/wiki/Molloy_(novel)\n",256,"Molloy, Malone Dies, The Unnamable, the trilogy",1952
· Giovanni Boccaccio,Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron\n",1024,The Decameron,1351
· Jorge Luis Borges,Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones\n",224,Ficciones,1965
· Emily Brontë,United Kingdom,images/wuthering-heights.jpg,English,"https://en.wikipedia.org/wiki/Wuthering_Heights\n",342,Wuthering Heights,1847
· Albert Camus,"Algeria, French Empire",images/l-etranger.jpg,French,"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n",185,The Stranger,1942
· Paul Celan,"Romania, France",images/poems-paul-celan.jpg,German,"\n",320,Poems,1952
· Louis-Ferdinand Céline,France,images/voyage-au-bout-de-la-nuit.jpg,French,"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n",505,Journey to the End of the Night,1932
· Miguel de Cervantes,Spain,images/don-quijote-de-la-mancha.jpg,Spanish,"https://en.wikipedia.org/wiki/Don_Quixote\n",1056,Don Quijote De La Mancha,1610
· Geoffrey Chaucer,England,images/the-canterbury-tales.jpg,English,"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n",544,The Canterbury Tales,1450
· Anton Chekhov,Russia,images/stories-of-anton-chekhov.jpg,Russian,"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n",194,Stories,1886
· Joseph Conrad,United Kingdom,images/nostromo.jpg,English,"https://en.wikipedia.org/wiki/Nostromo\n",320,Nostromo,1904
· Charles Dickens,United Kingdom,images/great-expectations.jpg,English,"https://en.wikipedia.org/wiki/Great_Expectations\n",194,Great Expectations,1861
· Denis Diderot,France,images/jacques-the-fatalist.jpg,French,"https://en.wikipedia.org/wiki/Jacques_the_Fatalist\n",596,Jacques the Fatalist,1796
· Alfred Döblin,Germany,images/berlin-alexanderplatz.jpg,German,"https://en.wikipedia.org/wiki/Berlin_Alexanderplatz\n",600,Berlin Alexanderplatz,1929
· Fyodor Dostoevsky,Russia,images/crime-and-punishment.jpg,Russian,"https://en.wikipedia.org/wiki/Crime_and_Punishment\n",551,Crime and Punishment,1866
... (truncated)
TSON
chars: 14,448 tokens: 5,433 chars_og/tok: 5.1 enc_chars/tok: 2.7
{@author,country,imageLink,language,link,pages,title,year#100|"Chinua Achebe",Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart\n",209,"Things Fall Apart",1958|"Hans Christian Andersen",Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",784,"Fairy tales",1836|"Dante Alighieri",Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy\n",928,"The Divine Comedy",1315|Unknown,"Sumer and Akkadian Empire",images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n",160,"The Epic Of Gilgamesh",-1700|Unknown,"Achaemenid Empire",images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job\n",176,"The Book Of Job",-600|Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n",288,"One Thousand and One Nights",1200|Unknown,Iceland,images/njals-saga.jpg,"Old Norse","https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n",384,"Njál's Saga",1350|"Jane Austen","United Kingdom",images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n",226,"Pride and Prejudice",1813|"Honoré de Balzac",France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n",443,"Le Père Goriot",1835|"Samuel Beckett","Republic of Ireland",images/molloy-malone-dies-the-unnamable.jpg,"French, English","https://en.wikipedia.org/wiki/Molloy_(novel)\n",256,"Molloy, Malone Dies, The Unnamable, the trilogy",1952|"Giovanni Boccaccio",Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron\n",1024,"The Decameron",1351|"Jorge Luis Borges",Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones\n",224,Ficciones,1965|"Emily Brontë","United 
Kingdom",images/wuthering-heights.jpg,English,"https://en.wikipedia.org/wiki/Wuthering_Heights\n",342,"Wuthering Heights",1847|"Albert Camus","Algeria, French Empire",images/l-etranger.jpg,French,"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n",185,"The Stranger",1942|"Paul Celan","Romania, France",images/poems-paul-celan.jpg,German,"\n",320,Poems,1952|"Louis-Ferdinand Céline",France,images/voyage-au-bout-de-la-nuit.jpg,French,"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n",505,"Journey to the End of the Night",1932|"Miguel de Cervantes",Spain,images/don-quijote-de-la-mancha.jpg,Spanish,"https://en.wikipedia.org/wiki/Don_Quixote\n",1056,"Don Quijote De La Mancha",1610|"Geoffrey Chaucer",England,images/the-canterbury-tales.jpg,English,"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n",544,"The Canterbury Tales",1450|"Anton Chekhov",Russia,images/stories-of-anton-chekhov.jpg,Russian,"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n",194,Stories,1886|"Joseph Conrad","United Kingdom",images/nostromo.jpg,English,"https://en.wikipedia.org/wiki/Nostromo\n",320,Nostromo,1904|"Charles Dickens","United Kingdom",images/great-expectations.jpg,English,"https://en.wikipedia.org/wiki/Great_Expectations\n",194,"Great Expectations",1861|"Denis Diderot",France,images/jacques-the-fatalist.jpg,French,"https://en.wikipedia.org/wiki/Jacques_the_Fatalist\n",596,"Jacques the Fatalist",1796|"Alfred Döblin",Germany,images/berlin-alexanderplatz.jpg,German,"https://en.wikipedia.org/wiki/Berlin_Alexanderplatz\n",600,"Berlin Alexanderplatz",1929|"Fyodor Dostoevsky",Russia,images/crime-and-punishment.jpg,Russian,"https://en.wikipedia.org/wiki/Crime_and_Punishment\n",551,"Crime and Punishment",1866|"Fyodor Dostoevsky",Russia,images/the-idiot.jpg,Russian,"https://en.wikipedia.org/wiki/The_Idiot\n",656,"The Idiot",1869|"Fyodor Dostoevsky",Russia,images/the-possessed.jpg,Russian,"https://en.wikipedia.org/wiki/Demons_(Dostoyevsky_novel)\n",768,"The 
Possessed",1872|"Fyodor Dostoevsky",Russia,images/the-brothers-karamazov.jpg,Russian,"https://en.wikipedia.org/wiki/The_Brothers_Karamazov\n",824,"The Brothers Karamazov",1880|"George Eliot","United Kingdom",images/middlemarch.jpg,English,"https://en.wikipedia.org/wiki/Middlemarch\n",800,Middlemarch,1871|"Ralph Ellison","United States",images/invisible-man.jpg,English,"https://en.wikipedia.org/wiki/Invisible_Man\n",581,"Invisible Man",1952|Euripides,Greece,images/medea.jpg,Greek,"https://en.wikipedia.org/wiki/Medea_(play)\n",104,Medea,-431|"William Faulkner","United States",images/absalom-absalom.jpg,English,"https://en.wikipedia.org/wiki/Absalom,_Absalom!\n",313,"Absalom, Absalom!",1936|"William Faulkner","United States",images/the-sound-and-the-fury.jpg,English,"https://en.wikipedia.org/wiki/The_Sound_and_the_Fury\n",326,"The Sound and the Fury",1929|"Gustave Flaubert",France,images/madame-bovary.jpg,French,"https://en.wikipedia.org/wiki/Madame_Bovary\n",528,"Madame Bovary",1857|"Gustave Flaubert",France,images/l-education-sentimentale.jpg,French,"https://en.wikipedia.org/wiki/Sen
... (truncated)
minemizer
chars: 14,458 tokens: 5,152 chars_og/tok: 5.4 enc_chars/tok: 2.8
author; country; imageLink; language; link; pages; title; year
Chinua Achebe; Nigeria; images/things-fall-apart.jpg; English; https://en.wikipedia.org/wiki/Things_Fall_Apart
; 209; Things Fall Apart; 1958
Hans Christian Andersen; Denmark; images/fairy-tales.jpg; Danish; https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.
; 784; Fairy tales; 1836
Dante Alighieri; Italy; images/the-divine-comedy.jpg; Italian; https://en.wikipedia.org/wiki/Divine_Comedy
; 928; The Divine Comedy; 1315
Unknown; Sumer and Akkadian Empire; images/the-epic-of-gilgamesh.jpg; Akkadian; https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
; 160; The Epic Of Gilgamesh; -1700
Unknown; Achaemenid Empire; images/the-book-of-job.jpg; Hebrew; https://en.wikipedia.org/wiki/Book_of_Job
; 176; The Book Of Job; -600
Unknown; India/Iran/Iraq/Egypt/Tajikistan; images/one-thousand-and-one-nights.jpg; Arabic; https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
; 288; One Thousand and One Nights; 1200
Unknown; Iceland; images/njals-saga.jpg; Old Norse; https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
; 384; Njál's Saga; 1350
Jane Austen; United Kingdom; images/pride-and-prejudice.jpg; English; https://en.wikipedia.org/wiki/Pride_and_Prejudice
; 226; Pride and Prejudice; 1813
Honoré de Balzac; France; images/le-pere-goriot.jpg; French; https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
; 443; Le Père Goriot; 1835
Samuel Beckett; Republic of Ireland; images/molloy-malone-dies-the-unnamable.jpg; French, English; https://en.wikipedia.org/wiki/Molloy_(novel)
; 256; Molloy, Malone Dies, The Unnamable, the trilogy; 1952
Giovanni Boccaccio; Italy; images/the-decameron.jpg; Italian; https://en.wikipedia.org/wiki/The_Decameron
; 1024; The Decameron; 1351
Jorge Luis Borges; Argentina; images/ficciones.jpg; Spanish; https://en.wikipedia.org/wiki/Ficciones
; 224; Ficciones; 1965
... (truncated)
minemizer (compact)
chars: 13,753 tokens: 5,260 chars_og/tok: 5.3 enc_chars/tok: 2.6
author;country;imageLink;language;link;pages;title;year
Chinua Achebe;Nigeria;images/things-fall-apart.jpg;English;https://en.wikipedia.org/wiki/Things_Fall_Apart
;209;Things Fall Apart;1958
Hans Christian Andersen;Denmark;images/fairy-tales.jpg;Danish;https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.
;784;Fairy tales;1836
Dante Alighieri;Italy;images/the-divine-comedy.jpg;Italian;https://en.wikipedia.org/wiki/Divine_Comedy
;928;The Divine Comedy;1315
Unknown;Sumer and Akkadian Empire;images/the-epic-of-gilgamesh.jpg;Akkadian;https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
;160;The Epic Of Gilgamesh;-1700
Unknown;Achaemenid Empire;images/the-book-of-job.jpg;Hebrew;https://en.wikipedia.org/wiki/Book_of_Job
;176;The Book Of Job;-600
Unknown;India/Iran/Iraq/Egypt/Tajikistan;images/one-thousand-and-one-nights.jpg;Arabic;https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
;288;One Thousand and One Nights;1200
Unknown;Iceland;images/njals-saga.jpg;Old Norse;https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
;384;Njál's Saga;1350
Jane Austen;United Kingdom;images/pride-and-prejudice.jpg;English;https://en.wikipedia.org/wiki/Pride_and_Prejudice
;226;Pride and Prejudice;1813
Honoré de Balzac;France;images/le-pere-goriot.jpg;French;https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
;443;Le Père Goriot;1835
Samuel Beckett;Republic of Ireland;images/molloy-malone-dies-the-unnamable.jpg;French, English;https://en.wikipedia.org/wiki/Molloy_(novel)
;256;Molloy, Malone Dies, The Unnamable, the trilogy;1952
Giovanni Boccaccio;Italy;images/the-decameron.jpg;Italian;https://en.wikipedia.org/wiki/The_Decameron
;1024;The Decameron;1351
Jorge Luis Borges;Argentina;images/ficciones.jpg;Spanish;https://en.wikipedia.org/wiki/Ficciones
;224;Ficciones;1965
... (truncated)
countries.json — Original: 1133948 chars — Tokenizer: gpt2 (openai-community/gpt2)
Format | Chars | Tokens | chars_og/tok | enc_chars/tok
JSON (pretty) | 1,133,948 | 677,260 | 1.7 | 1.7
JSON (min) | 787,962 | 339,487 | 3.3 | 2.3
CSV | N/A
TSV | N/A
YAML | 641,939 | 345,580 | 3.3 | 1.9
TOON | 691,140 | 397,301 | 2.9 | 1.7
TSON | 423,383 | 210,056 | 5.4 | 2.0
minemizer | 323,130 | 166,573 | 6.8 | 1.9
minemizer (compact) | 299,485 | 170,841 | 6.6 | 1.8
JSON (pretty)
chars: 1,133,948 tokens: 677,260 chars_og/tok: 1.7 enc_chars/tok: 1.7
[
· {
··· "name": {
····· "common": "Aruba",
····· "official": "Aruba",
····· "native": {
······· "nld": {
········· "official": "Aruba",
········· "common": "Aruba"
······· },
······· "pap": {
········· "official": "Aruba",
········· "common": "Aruba"
······· }
····· }
··· },
··· "tld": [
····· ".aw"
··· ],
··· "cca2": "AW",
··· "ccn3": "533",
··· "cca3": "ABW",
··· "cioc": "ARU",
··· "independent": false,
··· "status": "officially-assigned",
... (truncated)
JSON (min)
chars: 787,962 tokens: 339,487 chars_og/tok: 3.3 enc_chars/tok: 2.3
[{"name":{"common":"Aruba","official":"Aruba","native":{"nld":{"official":"Aruba","common":"Aruba"},"pap":{"official":"Aruba","common":"Aruba"}}},"tld":[".aw"],"cca2":"AW","ccn3":"533","cca3":"ABW","cioc":"ARU","independent":false,"status":"officially-assigned","unMember":false,"unRegionalGroup":"","currencies":{"AWG":{"name":"Aruban florin","symbol":"\u0192"}},"idd":{"root":"+2","suffixes":["97"]},"capital":["Oranjestad"],"altSpellings":["AW"],"region":"Americas","subregion":"Caribbean","languages":{"nld":"Dutch","pap":"Papiamento"},"translations":{"ara":{"official":"\u0623\u0631\u0648\u0628\u0627","common":"\u0623\u0631\u0648\u0628\u0627"},"bre":{"official":"Aruba","common":"Aruba"},"ces":{"official":"Aruba","common":"Aruba"},"deu":{"official":"Aruba","common":"Aruba"},"est":{"official":"Aruba","common":"Aruba"},"fin":{"official":"Aruba","common":"Aruba"},"fra":{"official":"Aruba","common":"Aruba"},"hrv":{"official":"Aruba","common":"Aruba"},"hun":{"official":"Aruba","common":"Aruba"},"ita":{"official":"Aruba","common":"Aruba"},"jpn":{"official":"\u30a2\u30eb\u30d0","common":"\u30a2\u30eb\u30d0"},"kor":{"official":"\uc544\ub8e8\ubc14","common":"\uc544\ub8e8\ubc14"},"nld":{"official":"Aruba","common":"Aruba"},"per":{"official":"\u0622\u0631\u0648\u0628\u0627","common":"\u0622\u0631\u0648\u0628\u0627"},"pol":{"official":"Aruba","common":"Aruba"},"por":{"official":"Aruba","common":"Aruba"},"rus":{"official":"\u0410\u0440\u0443\u0431\u0430","common":"\u0410\u0440\u0443\u0431\u0430"},"slk":{"official":"Aruba","common":"Aruba"},"spa":{"official":"Aruba","common":"Aruba"},"srp":{"official":"Aruba","common":"Aruba"},"swe":{"official":"Aruba","common":"Aruba"},"tur":{"official":"Aruba","common":"Aruba"},"urd":{"official":"\u0627\u0631\u0648\u0628\u0627","common":"\u0627\u0631\u0648\u0628\u0627"},"zho":{"official":"\u963f\u9c81\u5df4","common":"\u963f\u9c81\u5df4"}},"latlng":[12.5,-69.96666666],"landlocked":false,"borders":[],"area":180,"flag":"\ud83c\udde6\ud83c\uddfc","de
monyms":{"eng":{"f":"Aruban","m":"Aruban"},"fra":{"f":"Arubaise","m":"Arubais"}}},{"name":{"common":"Afghanistan","official":"Islamic Republic of Afghanistan","native":{"prs":{"official":"\u062c\u0645\u0647\u0648\u0631\u06cc \u0627\u0633\u0644\u0627\u0645\u06cc \u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"pus":{"official":"\u062f \u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646 \u0627\u0633\u0644\u0627\u0645\u064a \u062c\u0645\u0647\u0648\u0631\u06cc\u062a","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"tuk":{"official":"Owganystan Yslam Respublikasy","common":"Owganystan"}}},"tld":[".af"],"cca2":"AF","ccn3":"004","cca3":"AFG","cioc":"AFG","independent":true,"status":"officially-assigned","unMember":true,"unRegionalGroup":"Asia and the Pacific Group","currencies":{"AFN":{"name":"Afghan afghani","symbol":"\u060b"}},"idd":{"root":"+9","suffixes":["3"]},"capital":["Kabul"],"altSpellings":["AF","Af\u0121\u0101nist\u0101n"],"region":"Asia","subregion":"Southern Asia","languages":{"prs":"Dari","pus":"Pashto","tuk":"Turkmen"},"translations":{"ara":{"official":"\u062c\u0645\u0647\u0648\u0631\u064a\u0629 \u0623\u0641\u0641\u0627\u0646\u0633\u062a\u0627\u0646 \u0627\u0644\u0625\u0633\u0644\u0627\u0645\u064a\u0629","common":"\u0623\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"bre":{"official":"Republik Islamek Afghanistan","common":"Afghanistan"},"ces":{"official":"Afgh\u00e1nsk\u00e1 isl\u00e1msk\u00e1 republika","common":"Afgh\u00e1nist\u00e1n"},"deu":{"official":"Islamische Republik Afghanistan","common":"Afghanistan"},"est":{"official":"Afganistani Islamivabariik","common":"Afganistan"},"fin":{"official":"Afganistanin islamilainen tasavalta","common":"Afganistan"},"fra":{"official":"R\u00e9publique islamique d'Afghanistan","common":"Afghanistan"},"hrv":{"official":"Islamska Republika Afganistan","common":"Afganistan"},"hun":{"official":"Afganiszt\u00e1ni 
Iszl\u00e1m K\u00f6zt\u00e1rsas\u00e1g","common":"Afganiszt\u00e1n"},"ita":{"official":"Repubblica islamica dell'Afghanistan","common":"Afghanistan"},"jpn":{"official":"\u30a2\u30d5\u30ac\u30cb\u30b9\u30bf\u30f3\u30fb\u30a4\u30b9\u30e9\u30e0\u5171\u548c\u56fd","common":"\u30a2\u30d5\u30ac\u30cb\u30b9\u30bf\u30f3"},"kor":{"official":"\uc544\ud504\uac00\ub2c8\uc2a4\ud0c4 \uc774\uc2ac\ub78c \uacf5\ud654\uad6d","common":"\uc544\ud504\uac00\ub2c8\uc2a4\ud0c4"},"nld":{"official":"Islamitische Republiek Afghanistan","common":"Afghanistan"},"per":{"official":"\u062c\u0645\u0647\u0648\u0631\u06cc \u0627\u0633\u0644\u0627\u0645\u06cc \u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"pol":{"official":"Islamska Republika Afganistanu","common":"Afganistan"},"por":{"official":"Rep\u00fablica Isl\u00e2mica do Afeganist\u00e3o","common":"Afeganist\u00e3o"},"rus":{"official":"\u0418\u0441\u043b\u0430\u043c\u0441\u043a\u0430\u044f \u0420\
... (truncated)
CSV: N/A
TSV: N/A
YAML
chars: 641,939 tokens: 345,580 chars_og/tok: 3.3 enc_chars/tok: 1.9
- altSpellings:
· - AW
· area: 180
· borders: []
· capital:
· - Oranjestad
· cca2: AW
· cca3: ABW
· ccn3: '533'
· cioc: ARU
· currencies:
··· AWG:
····· name: Aruban florin
····· symbol:·
· demonyms:
··· eng:
····· f: Aruban
····· m: Aruban
··· fra:
····· f: Arubaise
····· m: Arubais
· flag:
··idd:
··· root: '+2'
··· suffixes:
... (truncated)
TOON
chars: 691,140 tokens: 397,301 chars_og/tok: 2.9 enc_chars/tok: 1.7
[250]:
· -
··· name:
····· common: Aruba
····· official: Aruba
····· native:
······· nld:
········· official: Aruba
········· common: Aruba
······· pap:
········· official: Aruba
········· common: Aruba
··· tld[1]: .aw
··· cca2: AW
··· ccn3: "533"
··· cca3: ABW
··· cioc: ARU
··· independent: false
··· status: officially-assigned
··· unMember: false
··· unRegionalGroup: ""
··· currencies:
····· AWG:
······· name: Aruban florin
······· symbol:·
... (truncated)
TSON
chars: 423,383 tokens: 210,056 chars_og/tok: 5.4 enc_chars/tok: 2.0
{@name(@common,official,native),tld,cca2,ccn3,cca3,cioc,independent,status,unMember,unRegionalGroup,currencies,idd(@root,suffixes),capital,altSpellings,region,subregion,languages,translations(@ara,bre,ces,deu,est,fin,fra,hrv,hun,ita,jpn,kor,nld,per,pol,por,rus,slk,spa,srp,swe,tur,urd,zho),latlng,landlocked,borders,area,flag,demonyms(@eng,fra)#250|{Aruba,Aruba,{@nld,pap|{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba}}},[.aw],AW,"533",ABW,ARU,false,officially-assigned,false,"",{@AWG|{@name,symbol|"Aruban florin",}},{"+2",["97"]},[Oranjestad],[AW],Americas,Caribbean,{@nld,pap|Dutch,Papiamento},{{@official,common|روبا,روبا},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|アル,アル},{@official,common|,},{@official,common|Aruba,Aruba},{@official,common|روبا,روبا},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|руа,руа},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|اروبا,اروبا},{@official,common|,}},[12.5,-69.96666666],false,[],180,,{{@f,m|Aruban,Aruban},{@f,m|Arubaise,Arubais}}|{Afghanistan,"Islamic Republic of Afghanistan",{@prs,pus,tuk|{@official,common|"مهور·ا�لام·اانستان",اانستان},{@official,common|"د·اانستان·ا�لاميمهورت",اانستان},{@official,common|"Owganystan Yslam Respublikasy",Owganystan}}},[.af],AF,"004",AFG,AFG,true,officially-assigned,true,"Asia and the Pacific Group",{@AFN|{@name,symbol|"Afghan afghani",}},{"+9",["3"]},[Kabul],[AF,Afānistān],Asia,"Southern Asia",{@prs,pus,tuk|Dari,Pashto,Turkmen},{{@official,common|"مهوريةانستان السلامية",انستان},{@official,common|"Republik Islamek Afghanistan",Afghanistan},{@official,common|"Afghánská islámská 
republika",Afghánistán},{@official,common|"Islamische Republik Afghanistan",Afghanistan},{@official,common|"Afganistani Islamivabariik",Afganistan},{@official,common|"Afganistanin islamilainen tasavalta",Afganistan},{@official,common|"République islamique d'Afghanistan",Afghanistan},{@official,common|"Islamska Republika Afganistan",Afganistan},{@official,common|"Afganisztáni Iszlám Köztársaság",Afganisztán},{@official,common|"Repubblica islamica dell'Afghanistan",Afghanistan},{@official,common|,},{@official,common|"·",},{@official,common|"Islamitische Republiek Afghanistan",Afghanistan},{@official,common|"مهور·ا�لام·اانستان",اانستان},{@official,common|"Islamska Republika Afganistanu",Afganistan},{@official,common|"República Islâmica do Afeganistão",Afeganistão},{@official,common|"сламскаяесуликаанистан",анистан},{@official,common|"Afgánsky islamsktát",Afganistan},{@official,common|"República Islámica de Afganistán",Afganistán},{@official,common|"Islamska Republika Avganistan",Avganistan},{@official,common|"Islamiska republiken Afghanistan",Afghanistan},{@official,common|"Afganistanslam Cumhuriyeti",Afganistan},{@official,common|"ا�لاممور·اانستان",اانستان},{@official,common|,}},[33,65],true,[IRN,PAK,TKM,UZB,TJK,CHN],652230,,{{@f,m|Afghan,Afghan},{@f,m|Afghane,Afghan}}|{Angola,"Republic of Angola",{@por|{@official,common|"República de Angola",Angola}}},[.ao],AO,"024",AGO,ANG,true,officially-assigned,true,"African Group",{@AOA|{@name,symbol|"Angolan kwanza",Kz}},{"+2",["44"]},[Luanda],[AO,"República de Angola","publika de an'la"],Africa,"Middle Africa",{@por|Portuguese},{{@official,common|نولا,"مهوريةنولا"},{@official,common|"Republik Angola",Angola},{@official,common|"Angolská republika",Angola},{@official,common|"Republik Angola",Angola},{@official,common|"Angola Vabariik",Angola},{@official,common|"Angolan tasavalta",Angola},{@official,common|"République d'Angola",Angola},{@official,common|"Republika 
Angola",Angola},{@official,common|Angola,Angola},{@official,common|"Repubblica dell'Angola",Angola},{@official,common|,},{@official,common|"·",},{@official,common|"Republiek Angola",Angola},{@official,common|"مهورنولا",نولا},{@official,common|"Republika Angoli",Angola},{@official,common|"República de Angola",Angola},{@official,common|"есуликано�а",но�а},{@official,common|"Angolská republika",Angola},{@official,common|"República de Angola",Angola},{@official,common|"Republika Angola",Angola},{@official,common|"Republiken Angola",Angola},{@official,common|"Angola Cumhuriyeti",Angola},{@official,common|"مور·انول",انول},{@official,common|,}},[-12.5,18.5],false,[COG,COD,ZMB,NAM],1246700,,{{@f,m|Angolan,Angolan},{@f,m|Angolaise,Angolais}}|{Anguilla,Anguilla,{@eng|{@official,common|Anguilla,Anguilla}}},[.ai],AI,"660",AIA,"",false,officially-assigned,false,"",{@XCD
... (truncated)
minemizer
chars: 323,130 tokens: 166,573 chars_og/tok: 6.8 enc_chars/tok: 1.9
name{ common; official; native{ ...}}; tld[]; cca2; ccn3; cca3; cioc; independent; status; unMember; unRegionalGroup; currencies{ ...};·idd{ root; suffixes[]}; capital[]; altSpellings[]; region; subregion; languages{ ...}; translations{ ara{ official; common}; bre{ official; common}; ces{ official; common}; deu{ official; common}; est{ official; common}; fin{ official; common}; fra{ official; common}; hrv{ official; common}; hun{ official; common}; ita{ official; common}; jpn{ official; common}; kor{ official; common}; nld{ official; common}; per{ official; common}; pol{ official; common}; por{ official; common}; rus{ official; common}; slk{ official; common}; spa{ official; common}; srp{ official; common}; swe{ official; common}; tur{ official; common};·urd{ official; common}; zho{ official; common}}; latlng[]; landlocked; borders[]; area; flag; demonyms{ eng{ f; m}; fra{ f; m}}
{ Aruba; Aruba;{ nld:{ official: Aruba; common: Aruba}; pap:{ official: Aruba; common: Aruba}}};[ .aw]; AW; 533; ABW; ARU;false; officially-assigned;false;;{ AWG:{ name: Aruban florin; symbol:·}};{ +2;[ 97]};[ Oranjestad];[ AW]; Americas; Caribbean;{ nld: Dutch; pap: Papiamento};{{روبا;روبا};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{·アル;·アル};{;};{ Aruba; Aruba};{روبا;روبا};{ Aruba; Aruba};{ Aruba; Aruba};{руа;руа};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{·اروبا;·اروبا};{;}};[ 12.5; -69.96666666];false;[]; 180;;{{ Aruban; Aruban};{ Arubaise; Arubais}}
{ Afghanistan; Islamic Republic of Afghanistan;{ prs:{ official:مهور·ا�لام·اانستان; common:·اانستان}; pus:{ official:·اانستان·ا�لاميمهورت; common:·اانستان}; tuk:{ official: Owganystan Yslam Respublikasy; common: Owganystan}}};[ .af]; AF; 004; AFG; AFG;true; officially-assigned;true; Asia and the Pacific Group;{ AFN:{ name: Afghan afghani; symbol:}};{ +9;[ 3]};[ Kabul];[ AF; Afānistān]; Asia; Southern Asia;{ prs: Dari; pus: Pashto; tuk: Turkmen};{{مهوريةانستان السلامية;انستان};{ Republik Islamek Afghanistan; Afghanistan};{ Afghánská islámská republika; Afghánistán};{ Islamische Republik Afghanistan; Afghanistan};{ Afganistani Islamivabariik; Afganistan};{ Afganistanin islamilainen tasavalta; Afganistan};{publique islamique d'Afghanistan; Afghanistan};{ Islamska Republika Afganistan; Afganistan};{ Afganisztáni Iszlám Köztársaság; Afganisztán};{ Repubblica islamica dell'Afghanistan; Afghanistan};{·;·};{·;};{ Islamitische Republiek Afghanistan; Afghanistan};{مهور·ا�لام·اانستان;·اانستان};{ Islamska Republika Afganistanu; Afganistan};{ República Islâmica do Afeganistão; Afeganistão};{сламскаяесуликаанистан;анистан};{ Afgánsky islamsktát; Afganistan};{ República Islámica de Afganistán; Afganistán};{ Islamska Republika Avganistan; Avganistan};{ Islamiska republiken Afghanistan; Afghanistan};{ Afganistanslam Cumhuriyeti; Afganistan};{·ا�لاممور·اانستان;·اانستان};{;}};[ 33; 65];true;[ IRN; PAK; TKM; UZB; TJK; CHN]; 652230;;{{ Afghan; Afghan};{ Afghane; Afghan}}
{ Angola; Republic of Angola;{ por:{ official: República de Angola; common: Angola}}};[ .ao]; AO; 024; AGO; ANG;true; officially-assigned;true; African Group;{ AOA:{ name: Angolan kwanza; symbol: Kz}};{ +2;[ 44]};[ Luanda];[ AO; República de Angola;·publika de an'la]; Africa; Middle Africa;{ por: Portuguese};{{نولا;مهوريةنولا};{ Republik Angola; Angola};{ Angolská republika; Angola};{ Republik Angola; Angola};{ Angola Vabariik; Angola};{ Angolan tasavalta; Angola};{publique d'Angola; Angola};{ Republika Angola; Angola};{ Angola; Angola};{ Repubblica dell'Angola; Angola};{·;·};{·;};{ Republiek Angola; Angola};{مهورنولا;نولا};{ Republika Angoli; Angola};{ República de Angola; Angola};{есуликано�а;но�а};{ Angolská republika; Angola};{ República de Angola; Angola};{ Republika Angola; Angola};{ Republiken Angola; Angola};{ Angola Cumhuriyeti; Angola};{مور·انول;·انول};{;}};[ -12.5; 18.5];false;[ COG; COD; ZMB; NAM]; 1246700;;{{ Angolan; Angolan};{ Angolaise; Angolais}}
{ Anguilla; Anguilla;{ eng:{ official: Anguilla; common: Anguilla}}};[ .ai]; AI; 660; AIA;;false; officially-assigned;false;;{ XCD:{ name: Eastern Caribbean dollar; symbol: $}};{ +1;[ 264]};[ The Valley];[ AI]; Americas; Caribbean;{ eng: English};{{نويلا;نويلا};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Angvila};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{·;·};{;};{ Anguilla; Anguilla};{نولا;نولا};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{нилья;нилья};{ Anguilla; Anguilla};{ Anguila; Anguilla};{ Angvila; Angvila};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{·انولا;·انولا};{;}};[ 18.25; -63.16666666];false;[]; 91;;{{ Anguillian; Anguillian};{ Anguillane; Anguillan}}
{land Islands;land Islands;{ swe:{ official: Landskapetland; common:land}}};[ .ax]; AX; 248; ALA;;false; officially-assigned;false;;{ EUR:{ name: Euro; symbol:}};{ +3;[ 5818]};[ Mariehamn];[ AX; Aaland; Aland; Ahvenanmaa]; Europe; Northern Europe;{ swe: Swedish};{{رولاند;رولاند};{ Iniziland;land};{landské ostrovy;landy};{land-Inseln;land};{ Ahvenamaa maakond; Ahvenamaa};{ Ahvenanmaan maakunta; Ahvenanmaa};{ Ahvenanmaa; Ahvenanmaa};{ Aland Islands;landski otoci};{land-szigetek;land-szigetek};{ Isoleland; Isole Aland};{ラン;ラン};{;};{land eilanden;landeilanden};{ار الند;ار الند};{ Wyspy Alandzkie; Wyspy Alandzkie};{ Ilhasland; Alândia};{ландскиестро�а;ландскиестро�а};{ Alandské ostrovy; Alandy};{ Islasland; Alandia};{ Olandska Ostrva; Olandska Ostrva};{land;land};{land Adaları;land};{ا�ر·اولند;ا�ر·اولند};{;}};[ 60.116667; 19.9];false;[]; 1580;;{{landish;landish};{landaise;landais}}
{ Albania; Republic of Albania;{ sqi:{ official: Republika e Shqipërisë; common: Shqipëria}}};[ .al]; AL; 008; ALB; ALB;true; officially-assigned;true; Eastern European Group;{ ALL:{ name: Albanian lek; symbol: L}};{ +3;[ 55]};[ Tirana];[ AL; Shqipëri; Shqipëria; Shqipnia]; Europe; Southeast Europe;{ sqi: Albanian};{{مهوريةلبانيا;لبانيا};{ Republik Albania; Albania};{ Albánská republika; Albánie};{ Republik Albanien; Albanien};{ Albaania Vabariik; Albaania};{ Albanian tasavalta; Albania};{publique d'Albanie; Albanie};{ Republika Albanija; Albanija};{ Albán Köztársaság; Albánia};{ Repubblica d'Albania; Albania};{·アル;·アル};{·;};{ Republiek Albanië; Albanië};{مهورلبان;لبان};{ Republika Albanii; Albania};{ República da Albânia; Albânia};{есуликалания;лания};{ Albánska republika; Albánsko};{ República de Albania; Albania};{ Republika Albanija; Albanija};{ Republiken Albanien; Albanien};{ Arnavutluk Cumhuriyeti; Arnavutluk};{مور البانا; البانا};{;}};[ 41; 20];false;[ MNE; GRC; MKD; UNK]; 28748;;{{ Albanian; Albanian};{ Albanaise; Albanais}}
{ Andorra; Principality of Andorra;{ cat:{ official: Principat d'Andorra; common: Andorra}}};[ .ad]; AD; 020; AND; AND;true; officially-assigned;true; Western European and Others Group;{ EUR:{ name: Euro; symbol:}};{ +3;[ 76]};[ Andorra la Vella];[ AD; Principality of Andorra; Principat d'Andorra]; Europe; Southern Europe;{ cat: Catalan};{{مارةندورا;ندورا};{ Priñselezh Andorra; Andorra};{ Andorrské kníectví; Andorra};{ Fürstentum Andorra; Andorra};{ Andorra Vürstiriik; Andorra};{ Andorran ruhtinaskunta; Andorra};{ Principauté d'Andorre; Andorre};{ Kneevina Andora; Andora};{ Andorra; Andorra};{ Principato di Andorra; Andorra};{·ドラ;·ドラ};{·;};{ Prinsdom Andorra; Andorra};{اها�هننندورا;ندورا};{ Ksistwo Andory; Andora};{ Principado de Andorra; Andorra};{няествондорра;ндорра};{ Andorrské knieatstvo; Andorra};{ Principado de Andorra; Andorra};{ Kneevina Andora; Andora};{ Furstendömet Andorra; Andorra};{ Andorra Prensliği; Andorra};{·امارا�ِ·انورا;·انورا};{;}};[ 42.5; 1.5];true;[ FRA; ESP]; 468;;{{ Andorran; Andorran};{ Andorrane; Andorran}}
{ United Arab Emirates; United Arab Emirates;{ ara:{ official: المارا� العربية المتدة; common: المارا�}}};[ .ae;·امارا�.]; AE; 784; ARE; UAE;true; officially-assigned;true; Asia and the Pacific Group;{ AED:{ name: United Arab Emirates dirham; symbol:.}};{ +9;[ 71]};[ Abu Dhabi];[ AE; UAE; Emirates]; Asia; Western Asia;{ ara: Arabic};{{ المارا� العربية المتدة; المارا�};{ Emirelezhio Arab Unanet; Emirelezhio Arab Unanet};{ Spojené arabské emiráty; Spojené arabské emiráty};{ Vereinigte Arabische Emirate; Vereinigte Arabische Emirate};{ Araabia Ühendemiraadid; Araabia Ühendemiraadid};{ Yhdistyneet arabiemiirikunnat; Arabiemiraatit};{ Émirats arabes unis; Émirats arabes unis};{ Ujedinjeni Arapski Emirati; Ujedinjeni Arapski Emirati};{ Egyesült Arab Emírségek; Egyesült Arab Emírségek};{ Emirati Arabi Uniti; Emirati Arabi Uniti};{·; UAE};{·;};{ Verenigde Arabische Emiraten; Verenigde Arabische Emiraten};{·امارا� متدهرب;·امارا�};{ Zjednoczone Emiraty Arabskie; Zjednoczone Emiraty Arabskie};{ Emiradosrabes Unidos; Emiradosrabes Unidos};{единенныераскиемираты;единнныераскиемираты};{ Spojené arabské emiráty; Spojené arabské emiráty};{ Emiratosrabes Unidos; Emiratosrabes Unidos};{ Ujedinjeni Arapski Emirati; Ujedinjeni Arapski Emirati};{ Förenade Arabemiraten; Förenade Arabemiraten};{ Birleşik Arap Emirlikleri; Birleşik Arap Emirlikleri};{ متدرب·امارا�; متدرب·امارا�};{��;��}};[ 24; 54];false;[ OMN; SAU]; 83600;;{{ Emirati; Emirati};{ Emirienne; Emirien}}
{ Argentina; Argentine Republic;{ grn:{ official: Argentine Republic; common: Argentina}; spa:{ official: República Argentina; common: Argentina}}};[ .ar]; AR; 032; ARG; ARG;true; officially-assigned;true; Latin American and Caribbean Group;{ ARS:{ name: Argentine peso; symbol: $}};{ +5;[ 4]};[ Buenos Aires];[ AR; Argentine Republic; República Argentina]; Americas; South America;{ grn: Guaraní; spa: Spanish};{{مهورية الرنتين; الرنتين};{ Republik Arc'hantina; Arc'hantina};{ Argentinská republika; Argentina};{ Argentinische Republik; Argentinien};{ Argentina Vabariik; Argentina};{ Argentiinan tasavalta; Argentiina};{publique argentine; Argentine};{ Argentinski Republika; Argentina};{ Argentin Köztársaság; Argentína};{ Repubblica Argentina; Argentina};{·アル;·アル};{·;};{ Argentijnse Republiek; Argentinië};{مهوررانتن;رانتن};{ Republika Argentyska; Argentyna};{ República Argentina; Argentina};{рентинскаяесулика;рентина};{ Argentínska republika; Argentína};{ República Argentina; Argentina};{ Republika Argentina; Argentina};{ Republiken Argentina; Argentina};{ Arjantin Cumhuriyeti; Arjantin};{مور·ارنا�ن;·ارنا�ن};{;}};[ -34; -64];false;[ BOL; BRA; CHL; PRY; URY]; 2780400;;{{ Argentine; Argentine};{ Argentine; Argentin}}
{ Armenia; Republic of Armenia;{ hye:{ official:··; common:·}}};[ .am]; AM; 051; ARM; ARM;true; officially-assigned;true; Eastern European Group;{ AMD:{ name: Armenian dram; symbol:·}};{ +3;[ 74]};[ Yerevan];[ AM; Hayastan; Republic of Armenia;··]; Asia; Western Asia;{ hye: Armenian};{{مهوريةرمينيا;رمينيا};{ Republik Armenia; Armenia};{ Arménská republika; Arménie};{ Republik Armenien; Armenien};{ Armeenia Vabariik; Armeenia};{ Armenian tasavalta; Armenia};{publique d'Arménie; Arménie};{ Republika Armenija; Armenija};{ Örményország; Örményország};{ Repubblica di Armenia; Armenia};{·アル;·アル};{·;};{ Republiek Armenië; Armenië};{مهور·ارمنستان;·ارمنستان};{ Republika Armenii; Armenia};{ República da Arménia; Arménia};{есуликармения;рмения};{ Arménska republika; Arménsko};{ República de Armenia; Armenia};{ Republika Jermenija; Jermenija};{ Republiken Armenien; Armenien};{ Ermenistan Cumhuriyeti; Ermenistan};{موررمنا;رمنا};{·;·}};[ 40; 45];true;[ AZE; GEO; IRN; TUR]; 29743;;{{ Armenian; Armenian};{ Arménienne; Arménien}}
{ American Samoa; American Samoa;{ eng:{ official: American Samoa; common: American Samoa}; smo:{ official: Sāmoa Amelika; common: Sāmoa Amelika}}};[ .as]; AS; 016; ASM; ASA;false; officially-assigned;false;;{ USD:{ name: United States dollar; symbol: $}};{ +1;[ 684]};[ Pago Pago];[ AS; Amerika Sāmoa; Amelika Sāmoa; Sāmoa Amelika]; Oceania; Polynesia;{ eng: English; smo: Samoan};{{اموا المريية;اموا المريية};{ Samoa Amerikan; Samoa Amerikan};{ Americká Samoa; Americká Samoa};{ Amerikanisch-Samoa; Amerikanisch-Samoa};{ Ameerika Samoa; Ameerika Samoa};{ Amerikan Samoa; Amerikan Samoa};{ Samoa américaines; Samoa américaines};{ američka Samoa; Američka Samoa};{ Szamoa; Szamoa};{ Samoa americane; Samoa Americane};{;·};{��;��};{ Amerikaans Samoa; Amerikaans Samoa};{امومرا;امومرا};{ Samoa Amerykaskie; Samoa Amerykaskie};{ Samoa americana; Samoa Americana};{мериканскоеамоа;мериканскоеамоа};{ Americká Samoa; Americká Samoa};{ Samoa Americana; Samoa Americana};{ Američka Samoa; Američka Samoa};{ Amerikanska Samoa; Amerikanska Samoa};{ Amerikan Samoası; Amerikan Samoası};{·امرمووا;·امرمووا};{;}};[ -14.33333333; -170];false;[]; 199;;{{ American Samoan; American Samoan};{ Samoane; Samoan}}
{ Antarctica; Antarctica;{}};[ .aq]; AQ; 010; ATA;;false; officially-assigned;false;;{};{;[]};[];[ AQ]; Antarctic;;{};{{نتارتيا;نتارتيا};{ Antarktika; Antarktika};{ Antarktida; Antarktida};{ Antarktika; Antarktis};{ Antarktika; Antarktika};{ Etelämanner; Etelämanner};{ Antarctique; Antarctique};{ Antarktika; Antarktika};{ Antarktisz; Antarktisz};{ Antartide; Antartide};{��;��};{;};{ Antarctica; Antarctica};{نوبان;نوبان};{ Antarktyka; Antarktyka};{ Antártica; Antártida};{нтарктида;нтарктида};{ Antarktída; Antarktída};{ Antártida; Antártida};{ Antarktik; Antarktik};{ Antarktis; Antarktis};{ Antarktika; Antarktika};{·انارا;·انارا};{;}};[ -90; 0];false;[]; 14000000;;{{ Antarctican; Antarctican};{ Antarcticaine; Antarcticain}}
{ French Southern and Antarctic Lands; Territory of the French Southern and Antarctic Lands;{ fra:{ official: Territoire des Terres australes et antarctiques françaises; common: Terres australes et antarctiques françaises}}};[ .tf]; TF; 260; ATF;;false; officially-assigned;false;;{ EUR:{ name: Euro; symbol:}};{ +2;[ 62]};[ Port-aux-Français];[ TF; French Southern Territories]; Antarctic;;{ fra: French};{{ ما�عا� واليم ما ورا� البار الرنسية;را�رنسيةنوبية ونتارتيية};{ Tiriad Douaro Aostral hag Antarktikel Frañs; Douaro Aostral hag Antarktikel Frañs};{ Teritorium Francouzská jiní a antarktickázemí; Francouzská jiní a antarktickázemí};{ Gebiet der Französisch Süd- und Antarktisgebiete; Französische Süd- und Antarktisgebiete};{ Prantsuse Lunaalad; Prantsuse Lunaalad};{ Ranskan eteläiset ja antarktiset alueet; Ranskan eteläiset ja antarktiset alueet};{ Territoire des Terres australes et antarctiques françaises; Terres australes et antarctiques françaises};{ Teritoriju Francuski juni i antarktički teritoriji; Francuski juni i antarktički teritoriji};{ Franciali·és antarktiszi területek; Franciali·és antarktiszi területek};{ Territorio della australi e antartiche francesi Terre; Territori Francesi del Sud};{ラン��;ラン��};{·;·};{ Grondgebied van de Franse Zuidelijke en Antarctische gebieden; Franse Gebieden in de zuidelijke Indische Oceaan};{رمنهانوب ونوبانرانسه;رمنهانوب ونوبانرانسه};{ Francuskie Terytoria Południowe i Antarktyczne; Francuskie Terytoria Południowe i Antarktyczne};{ Território do Sul e Antártica Francesa; Terras Austrais e Antárticas Francesas};{ерриторияранускиеныентарктиескиеемли;ранускиеныентарктиеские·территории};{ Francúzske juné a antarktickézemia; Francúzske juné a antarktickézemia};{ Territorio del Francés Tierras australes y antárticas; Tierras Australes y Antárticas Francesas};{ Francuske june i antarktičke zemlje; Francuske june i antarktičke zemlje};{ Franska syd- och Antarktisterritorierna; Franska södra territorierna};{ Fransız Güney ve Antarktika 
Toprakları; Fransız Güney ve Antarktika Toprakları};{رمنِنوبرانسس و·انار;رمننوبرانسس و·انارا};{;}};[ -49.25; 69.167];false;[]; 7747;;{{ French; French};{ Française; Français}}
{ Antigua and Barbuda; Antigua and Barbuda;{ eng:{ official: Antigua and Barbuda; common: Antigua and Barbuda}}};[ .ag]; AG; 028; ATG; ANT;true; officially-assigned;true; Latin American and Caribbean Group;{ XCD:{ name: Eastern Caribbean dollar; symbol: $}};{ +1;[ 268]};[ Saint John's];[ AG]; Americas; Caribbean;{ eng: English};{{نتيوا وباربودا;نتيوا وباربودا};{ Antigua ha Barbuda; Antigua ha Barbuda};{ Antigua a Barbuda; Antigua a Barbuda};{ Antigua und Barbuda; Antigua und Barbuda};{ Antigua ja Barbuda; Antigua ja Barbuda};{ Antigua ja Barbuda; Antigua ja Barbuda};{ Antigua -et-Barbuda; Antigua-et-Barbuda};{ Antigva i Barbuda; Antigva i Barbuda};{ Antigua·és Barbuda; Antigua·és Barbuda};{ Antigua e Barbuda; Antigua e Barbuda};{·ティー�ー�;·ティー�ー�};{;};{ Antigua en Barbuda; Antigua en Barbuda};{نتوا واربودا;نتوا واربودا};{ Antigua i Barbuda; Antigua i Barbuda};{ Antigua e Barbuda; Antígua e Barbuda};{нтиуааруда;нтиуааруда};{ Antigua a Barbuda; Antigua a Barbuda};{ Antigua y Barbuda; Antigua y Barbuda};{ Antigva i Barbuda; Antigva i Barbuda};{ Antigua och Barbuda; Antigua och Barbuda};{ Antigua ve Barbuda; Antigua ve Barbuda};{·انوا واربوا;·انوا واربوا};{;}};[ 17.05; -61.8];false;[]; 442;;{{ Antiguan, Barbudan; Antiguan, Barbudan};{ Antiguaise et barbudienne; Antiguaise et barbudien}}
{ Australia; Commonwealth of Australia;{ eng:{ official: Commonwealth of Australia; common: Australia}}};[ .au]; AU; 036; AUS; AUS;true; officially-assigned;true; Western European and Others Group;{ AUD:{ name: Australian dollar; symbol: $}};{ +6;[ 1]};[ Canberra];[ AU]; Oceania; Australia and New Zealand;{ eng: English};{{ومونولستراليا;ستراليا};{ Kenglad Aostralia; Aostralia};{ Australské společenství; Austrálie};{ Commonwealth Australien; Australien};{ Austraalia Ühendus; Austraalia};{ Australian liittovaltio; Australia};{ Australie; Australie};{ Commonwealth of Australia; Australija};{ Ausztrálllamszövetség; Ausztrália};{ Commonwealth dell'Australia; Australia};{スト;スト};{;·};{ Gemenebest van Australië; Australië};{لمرومسود·ا�ترالا;·ا�ترالا};{ Zwizek Australijski; Australia};{ Comunidade da Austrália; Austrália};{о�руествовстралии;встралия};{ Austrálsky zväz; Austrália};{ Mancomunidad de Australia; Australia};{ Komonvelt Australija; Australija};{ Australiska statsförbundet; Australien};{ Avustralya Federal Devleti; Avustralya};{ولتِ مترسرلا;سرلا};{;}};[ -27; 133];false;[]; 7692024;;{{ Australian; Australian};{ Australienne; Australien}}
{ Austria; Republic of Austria;{ bar:{ official: Republik Österreich; common: Österreich}}};[ .at]; AT; 040; AUT; AUT;true; officially-assigned;true; Western European and Others Group;{ EUR:{ name: Euro; symbol:}};{ +4;[ 3]};[ Vienna];[ AT; Osterreich; Oesterreich]; Europe; Central Europe;{ bar: Austro-Bavarian German};{{مهورية النمسا; النمسا};{ Republik Aostria; Aostria};{ Rakouská republika; Rakousko};{ Republik Österreich; Österreich};{ Austria Vabariik; Austria};{ Itävallan tasavalta; Itävalta};{publique d'Autriche; Autriche};{ Republika Austrija; Austrija};{ Ausztria; Ausztria};{ Repubblica d'Austria; Austria};{スト;スト};{·;};{ Republiek Oostenrijk; Oostenrijk};{مهور·ا�ر;·ا�ر};{ Republika Austrii; Austria};{ República daustria;ustria};{встрискаяесулика;встрия};{ Rakúska republika; Rakúsko};{ República de Austria; Austria};{ Republika Austrija; Austrija};{ Republiken Österrike; Österrike};{ Avusturya Cumhuriyeti; Avusturya};{مورسرا;سرا};{;}};[ 47.33333333; 13.33333333];true;[ CZE; DEU; HUN; ITA; LIE; SVK; SVN; CHE]; 83871;;{{ Austrian; Austrian};{ Autrichienne; Autrichien}}
{ Azerbaijan; Republic of Azerbaijan;{ aze:{ official: Azrbaycan Respublikası; common: Azrbaycan}; rus:{ official:ераданскаяесулика; common:ерадан}}};[ .az]; AZ; 031; AZE; AZE;true; officially-assigned;true; Eastern European Group;{ AZN:{ name: Azerbaijani manat; symbol:}};{ +9;[ 94]};[ Baku];[ AZ; Republic of Azerbaijan; Azrbaycan Respublikası]; Asia; Western Asia;{ aze: Azerbaijani; rus: Russian};{{مهوريةربيان;ربيان};{ Republik Azerbaidjan; Azerbaidjan};{zerbájdánská republika;zerbájdán};{ Republik Aserbaidschan; Aserbaidschan};{ Aserbaidaani Vabariik; Aserbaidaan};{ Azerbaidzanin tasavalta; Azerbaidzan};{publique d'Azerbaïdjan; Azerbaïdjan};{ Republika Azerbajdan; Azerbajdan};{ Azerbajdzsán; Azerbajdzsán};{ Repubblica dell'Azerbaigian; Azerbaijan};{·;·};{·;};{ Republiek Azerbeidzjan; Azerbeidzjan};{مهوررباان;مهوررباان};{ Republika Azerbejdanu; Azerbejdan};{ República do Azerbaijão; Azerbeijão};{ераданскаяесулика;ерадан};{ Azerbajanská republika; Azerbajan};{ República de Azerbaiyán; Azerbaiyán};{ Republika Azerbejdan; Azerbejdan};{ Republiken Azerbajdzjan; Azerbajdzjan};{ Azerbaycan Cumhuriyeti; Azerbaycan};{مورربا�ان;ربا�ان};{;}};[ 40.5; 47.5];true;[ ARM; GEO; IRN; RUS; TUR]; 86600;;{{ Azerbaijani; Azerbaijani};{ Azerbaïdjanaise; Azerbaïdjanais}}
{ Burundi; Republic of Burundi;{ fra:{ official:publique du Burundi; common: Burundi}; run:{ official: Republika y'Uburundi ; common: Uburundi}}};[ .bi]; BI; 108; BDI; BDI;true; officially-assigned;true; African Group;{ BIF:{ name: Burundian franc; symbol: Fr}};{ +2;[ 57]};[ Gitega];[ BI; Republic of Burundi; Republika y'Uburundi;publique du Burundi]; Africa; Eastern Africa;{ fra: French; run: Kirundi};{{مهوريةوروندي;وروندي};{ Republik Burundi; Burundi};{ Burundská republika; Burundi};{ Republik Burundi; Burundi};{ Burundi Vabariik; Burundi};{ Burundin tasavalta; Burundi};{publique du Burundi; Burundi};{ Burundi; Burundi};{ Burundi; Burundi};{ Repubblica del Burundi; Burundi};{ンジ;ンジ};{;};{ Republiek Burundi; Burundi};{مهوروروند;وروند};{ Republika Burundi; Burundi};{ República do Burundi; Burundi};{есуликаурунди;урунди};{ Burundská republika; Burundi};{ República de Burundi; Burundi};{ Republika Burundi; Burundi};{ Republiken Burundi; Burundi};{ Burundi Cumhuriyeti; Burundi};{موررون;رون};{;}};[ -3.5; 30];true;[ COD; RWA; TZA]; 27834;;{{ Burundian; Burundian};{ Burundaise; Burundais}}
{ Belgium; Kingdom of Belgium;{ deu:{ official: Königreich Belgien; common: Belgien}; fra:{ official: Royaume de Belgique; common: Belgique}; nld:{ official: Koninkrijk België; common: België}}};[ .be]; BE; 056; BEL; BEL;true; officially-assigned;true; Western European and Others Group;{ EUR:{ name: Euro; symbol:}};{ +3;[ 2]};[ Brussels];[ BE; België; Belgie; Belgien; Belgique; Kingdom of Belgium; Koninkrijk België; Royaume de Belgique; Königreich Belgien]; Europe; Western Europe;{ deu: German; fra: French; nld: Dutch};{{ مملةليا;ليا};{ Rouantelezh Belgia; Belgia};{ Belgické království; Belgie};{ Königreich Belgien; Belgien};{ Belgia Kuningriik; Belgia};{ Belgian kuningaskunta; Belgia};{ Royaume de Belgique; Belgique};{ Kraljevina Belgija; Belgija};{ Belga Királyság; Belgium};{ Regno del Belgio; Belgio};{;};{;};{ Koninkrijk België; België};{ا�اهل;ل};{ Królestwo Belgii; Belgia};{ Reino da Bélgica; Bélgica};{оро�евствоельия;ельия};{ Belgické kráovstvo; Belgicko};{ Reino de Bélgica; Bélgica};{ Kraljevina Belgija; Belgija};{ Konungariket Belgien; Belgien};{ Belçika Krallığı; Belçika};{ مملتِلم;لم};{;}};[ 50.83333333; 4];false;[ FRA; DEU; LUX; NLD]; 30528;;{{ Belgian; Belgian};{ Belge; Belge}}
{ Benin; Republic of Benin;{ fra:{ official:publique du Bénin; common: Bénin}}};[ .bj]; BJ; 204; BEN; BEN;true; officially-assigned;true; African Group;{ XOF:{ name: West African CFA franc; symbol: Fr}};{ +2;[ 29]};[ Porto-Novo];[ BJ; Republic of Benin;publique du Bénin]; Africa; Western Africa;{ fra: French};{{مهوريةنين;نين};{ Republik Benin; Benin};{ Beninská republika; Benin};{ Republik Benin; Benin};{ Benini Vabariik; Benin};{ Beninin tasavalta; Benin};{publique du Bénin; Bénin};{ Republika Benin; Benin};{ Benini Köztársaság; Benin};{ Repubblica del Benin; Benin};{;};{·;};{ Republiek Benin; Benin};{مهورنن;نن};{ Benin; Benin};{ República do Benin; Benin};{есуликаенин;енин};{ Beninská republika; Benin};{ República de Benin; Benín};{ Republika Benin; Benin};{ Republiken Benin; Benin};{ Benin Cumhuriyeti; Benin};{مورنن;نن};{;}};[ 9.5; 2.25];false;[ BFA; NER; NGA; TGO]; 112622;;{{ Beninese; Beninese};{ Béninoise; Béninois}}
{ Burkina Faso; Burkina Faso;{ fra:{ official:publique du Burkina; common: Burkina Faso}}};[ .bf]; BF; 854; BFA; BUR;true; officially-assigned;true; African Group;{ XOF:{ name: West African CFA franc; symbol: Fr}};{ +2;[ 26]};[ Ouagadougou];[ BF]; Africa; Western Africa;{ fra: French};{{وريناا�و;وريناا�و};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{publique du Burkina; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina};{ Burkina Faso; Burkina Faso};{ファ;ファ};{;};{ Burkina Faso; Burkina Faso};{ورناا�و;ورناا�و};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{уркина -асо;уркина-асо};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{رناا�و;رناا�و};{;}};[ 13; -2];true;[ BEN; CIV; GHA; MLI; NER; TGO]; 272967;;{{ Burkinabe; Burkinabe};{ Burkinabée; Burkinabé}}
{ Bangladesh; People's Republic of Bangladesh;{ ben:{ official:··; common:·}}};[ .bd]; BD; 050; BGD; BAN;true; officially-assigned;true; Asia and the Pacific Group;{ BDT:{ name: Bangladeshi taka; symbol:·}};{ +8;[ 80]};[ Dhaka];[ BD; People's Republic of Bangladesh; Gônôprôjatôntri Bangladesh]; Asia; Southern Asia;{ ben: Bengali};{{مهوريةنلا�ي العبية;نلا�ي};{ Republik pobl Bangladesh; Bangladesh};{ Bangladéšská lidová republika; Bangladéš};{ Volksrepublik Bangladesch; Bangladesch};{ Bangladeshi Rahvavabariik; Bangladesh};{ Bangladeshin kansantasavalta; Bangladesh};{ Lapublique populaire du Bangladesh; Bangladesh};{ Narodna Republika Bangladeš; Bangladeš};{ Banglades; Banglades};{ Repubblica popolare del Bangladesh; Bangladesh};{;};{·;};{ Volksrepubliek Bangladesh; Bangladesh};{مهورلنلا�;نلا�};{ Ludowa Republika Bangladeszu; Bangladesz};{ República Popular do Bangladesh; Bangladesh};{аро�наяесуликаанладе;анладе};{ Bangladéšskaudová republika; Bangladéš};{ República Popular de Bangladesh; Bangladesh};{ Narodna Republika Bangladeš; Bangladeš};{ Folkrepubliken Bangladesh; Bangladesh};{ Bangladeş Halk Cumhuriyeti; Bangladeş};{واممورنل;نل};{;}};[ 24; 90];false;[ MMR; IND]; 147570;;{{ Bangladeshi; Bangladeshi};{ Bangladaise; Bangladais}}
{ Bulgaria; Republic of Bulgaria;{ bul:{ official:еуликалария; common:лария}}};[ .bg]; BG; 100; BGR; BUL;true; officially-assigned;true; Eastern European Group;{ BGN:{ name: Bulgarian lev; symbol:в}};{ +3;[ 59]};[ Sofia];[ BG; Republic of Bulgaria;еуликалария]; Europe; Southeast Europe;{ bul: Bulgarian};{{مهوريةلاريا;لاريا};{ Republik Bulgaria; Bulgaria};{ Bulharská republika; Bulharsko};{ Republik Bulgarien; Bulgarien};{ Bulgaaria Vabariik; Bulgaaria};{ Bulgarian tasavalta; Bulgaria};{publique de Bulgarie; Bulgarie};{ Republika Bugarska; Bugarska};{ Bolgár Köztársaság; Bulgária};{ Repubblica di Bulgaria; Bulgaria};{;};{·;};{ Republiek Bulgarije; Bulgarije};{مهورلارستان;لارستان};{ Republika Bułgarii; Bułgaria};{ República da Bulgária; Bulgária};{есуликао�ария;о�ария};{ Bulharská republika; Bulharsko};{ República de Bulgaria; Bulgaria};{ Republika Bugarska; Bugarska};{ Republiken Bulgarien; Bulgarien};{ Bulgaristan Cumhuriyeti; Bulgaristan};{مورلار;لار};{·;·}};[ 43; 25];false;[ GRC; MKD; ROU; SRB; TUR]; 110879;;{{ Bulgarian; Bulgarian};{ Bulgare; Bulgare}}
{ Bahrain; Kingdom of Bahrain;{ ara:{ official: مملة البرين; common: البرين}}};[ .bh]; BH; 048; BHR; BRN;true; officially-assigned;true; Asia and the Pacific Group;{ BHD:{ name: Bahraini dinar; symbol: .د.ب}};{ +9;[ 73]};[ Manama];[ BH; Kingdom of Bahrain; Mamlakat al-Barayn]; Asia; Western Asia;{ ara: Arabic};{{ مملة البرين; البرين};{ Rouantelezh Bahrein; Bahrein};{ Království Bahrajn; Bahrajn};{ Königreich Bahrain; Bahrain};{ Bahreini Kuningriik; Bahrein};{ Bahrainin kuningaskunta; Bahrain};{ Royaume de Bahreïn; Bahreïn};{ Kraljevina Bahrein; Bahrein};{ Bahreini Királyság; Bahrein};{ Regno del Bahrain; Bahrein};{ー�ーン;ー�ーン};{;};{ Koninkrijk Bahrein; Bahrein};{ا�اهرن;رن};{ Królestwo Bahrajnu; Bahrajn};{ Reino do Bahrein; Bahrein};{оро�евствоарен;арен};{ Bahrajnské kráovstvo; Bahrajn};{ Reino de Bahrein; Bahrein};{ Kraljevina Bahrein; Bahrein};{ Konungariket Bahrain; Bahrain};{ Bahreyn Krallığı; Bahreyn};{ مملتِرن;رن};{;}};[ 26; 50.55];false;[]; 765;;{{ Bahraini; Bahraini};{ Bahreïnienne; Bahreïnien}}
... (truncated)
minemizer (compact)
chars: 299,485 tokens: 170,841 chars_og/tok: 6.6 enc_chars/tok: 1.8
name{common;official;native{...}};tld[];cca2;ccn3;cca3;cioc;independent;status;unMember;unRegionalGroup;currencies{...};idd{root;suffixes[]};capital[];altSpellings[];region;subregion;languages{...};translations{ara{official;common};bre{official;common};ces{official;common};deu{official;common};est{official;common};fin{official;common};fra{official;common};hrv{official;common};hun{official;common};ita{official;common};jpn{official;common};kor{official;common};nld{official;common};per{official;common};pol{official;common};por{official;common};rus{official;common};slk{official;common};spa{official;common};srp{official;common};swe{official;common};tur{official;common};urd{official;common};zho{official;common}};latlng[];landlocked;borders[];area;flag;demonyms{eng{f;m};fra{f;m}}
{Aruba;Aruba;{nld:{official:Aruba;common:Aruba};pap:{official:Aruba;common:Aruba}}};[.aw];AW;533;ABW;ARU;false;officially-assigned;false;;{AWG:{name:Aruban florin;symbol:}};{+2;[97]};[Oranjestad];[AW];Americas;Caribbean;{nld:Dutch;pap:Papiamento};{{روبا;روبا};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{アル;アル};{;};{Aruba;Aruba};{روبا;روبا};{Aruba;Aruba};{Aruba;Aruba};{руа;руа};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{اروبا;اروبا};{;}};[12.5;-69.96666666];false;[];180;;{{Aruban;Aruban};{Arubaise;Arubais}}
{Afghanistan;Islamic Republic of Afghanistan;{prs:{official:مهور·ا�لام·اانستان;common:اانستان};pus:{official:د·اانستان·ا�لاميمهورت;common:اانستان};tuk:{official:Owganystan Yslam Respublikasy;common:Owganystan}}};[.af];AF;004;AFG;AFG;true;officially-assigned;true;Asia and the Pacific Group;{AFN:{name:Afghan afghani;symbol:}};{+9;[3]};[Kabul];[AF;Afānistān];Asia;Southern Asia;{prs:Dari;pus:Pashto;tuk:Turkmen};{{مهوريةانستان السلامية;انستان};{Republik Islamek Afghanistan;Afghanistan};{Afghánská islámská republika;Afghánistán};{Islamische Republik Afghanistan;Afghanistan};{Afganistani Islamivabariik;Afganistan};{Afganistanin islamilainen tasavalta;Afganistan};{République islamique d'Afghanistan;Afghanistan};{Islamska Republika Afganistan;Afganistan};{Afganisztáni Iszlám Köztársaság;Afganisztán};{Repubblica islamica dell'Afghanistan;Afghanistan};{;};{·;};{Islamitische Republiek Afghanistan;Afghanistan};{مهور·ا�لام·اانستان;اانستان};{Islamska Republika Afganistanu;Afganistan};{República Islâmica do Afeganistão;Afeganistão};{сламскаяесуликаанистан;анистан};{Afgánsky islamsktát;Afganistan};{República Islámica de Afganistán;Afganistán};{Islamska Republika Avganistan;Avganistan};{Islamiska republiken Afghanistan;Afghanistan};{Afganistanslam Cumhuriyeti;Afganistan};{ا�لاممور·اانستان;اانستان};{;}};[33;65];true;[IRN;PAK;TKM;UZB;TJK;CHN];652230;;{{Afghan;Afghan};{Afghane;Afghan}}
{Angola;Republic of Angola;{por:{official:República de Angola;common:Angola}}};[.ao];AO;024;AGO;ANG;true;officially-assigned;true;African Group;{AOA:{name:Angolan kwanza;symbol:Kz}};{+2;[44]};[Luanda];[AO;República de Angola;publika de an'la];Africa;Middle Africa;{por:Portuguese};{{نولا;مهوريةنولا};{Republik Angola;Angola};{Angolská republika;Angola};{Republik Angola;Angola};{Angola Vabariik;Angola};{Angolan tasavalta;Angola};{République d'Angola;Angola};{Republika Angola;Angola};{Angola;Angola};{Repubblica dell'Angola;Angola};{;};{·;};{Republiek Angola;Angola};{مهورنولا;نولا};{Republika Angoli;Angola};{República de Angola;Angola};{есуликано�а;но�а};{Angolská republika;Angola};{República de Angola;Angola};{Republika Angola;Angola};{Republiken Angola;Angola};{Angola Cumhuriyeti;Angola};{مور·انول;انول};{;}};[-12.5;18.5];false;[COG;COD;ZMB;NAM];1246700;;{{Angolan;Angolan};{Angolaise;Angolais}}
{Anguilla;Anguilla;{eng:{official:Anguilla;common:Anguilla}}};[.ai];AI;660;AIA;;false;officially-assigned;false;;{XCD:{name:Eastern Caribbean dollar;symbol:$}};{+1;[264]};[The Valley];[AI];Americas;Caribbean;{eng:English};{{نويلا;نويلا};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{;};{;};{Anguilla;Anguilla};{نولا;نولا};{Anguilla;Anguilla};{Anguilla;Anguilla};{нилья;нилья};{Anguilla;Anguilla};{Anguila;Anguilla};{Angvila;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{انولا;انولا};{;}};[18.25;-63.16666666];false;[];91;;{{Anguillian;Anguillian};{Anguillane;Anguillan}}
{land Islands;land Islands;{swe:{official:Landskapetland;common:land}}};[.ax];AX;248;ALA;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+3;[5818]};[Mariehamn];[AX;Aaland;Aland;Ahvenanmaa];Europe;Northern Europe;{swe:Swedish};{{رولاند;رولاند};{Iniziland;land};{landské ostrovy;landy};{land-Inseln;land};{Ahvenamaa maakond;Ahvenamaa};{Ahvenanmaan maakunta;Ahvenanmaa};{Ahvenanmaa;Ahvenanmaa};{Aland Islands;landski otoci};{land-szigetek;land-szigetek};{Isoleland;Isole Aland};{ラン;ラン};{;};{land eilanden;landeilanden};{ار الند;ار الند};{Wyspy Alandzkie;Wyspy Alandzkie};{Ilhasland;Alândia};{ландскиестро�а;ландскиестро�а};{Alandské ostrovy;Alandy};{Islasland;Alandia};{Olandska Ostrva;Olandska Ostrva};{land;land};{land Adaları;land};{ا�ر·اولند;ا�ر·اولند};{;}};[60.116667;19.9];false;[];1580;;{{landish;landish};{landaise;landais}}
{Albania;Republic of Albania;{sqi:{official:Republika e Shqipërisë;common:Shqipëria}}};[.al];AL;008;ALB;ALB;true;officially-assigned;true;Eastern European Group;{ALL:{name:Albanian lek;symbol:L}};{+3;[55]};[Tirana];[AL;Shqipëri;Shqipëria;Shqipnia];Europe;Southeast Europe;{sqi:Albanian};{{مهوريةلبانيا;لبانيا};{Republik Albania;Albania};{Albánská republika;Albánie};{Republik Albanien;Albanien};{Albaania Vabariik;Albaania};{Albanian tasavalta;Albania};{République d'Albanie;Albanie};{Republika Albanija;Albanija};{Albán Köztársaság;Albánia};{Repubblica d'Albania;Albania};{アル;アル};{·;};{Republiek Albanië;Albanië};{مهورلبان;لبان};{Republika Albanii;Albania};{República da Albânia;Albânia};{есуликалания;лания};{Albánska republika;Albánsko};{República de Albania;Albania};{Republika Albanija;Albanija};{Republiken Albanien;Albanien};{Arnavutluk Cumhuriyeti;Arnavutluk};{مور البانا;البانا};{;}};[41;20];false;[MNE;GRC;MKD;UNK];28748;;{{Albanian;Albanian};{Albanaise;Albanais}}
{Andorra;Principality of Andorra;{cat:{official:Principat d'Andorra;common:Andorra}}};[.ad];AD;020;AND;AND;true;officially-assigned;true;Western European and Others Group;{EUR:{name:Euro;symbol:}};{+3;[76]};[Andorra la Vella];[AD;Principality of Andorra;Principat d'Andorra];Europe;Southern Europe;{cat:Catalan};{{مارةندورا;ندورا};{Priñselezh Andorra;Andorra};{Andorrské kníectví;Andorra};{Fürstentum Andorra;Andorra};{Andorra Vürstiriik;Andorra};{Andorran ruhtinaskunta;Andorra};{Principauté d'Andorre;Andorre};{Kneevina Andora;Andora};{Andorra;Andorra};{Principato di Andorra;Andorra};{ドラ;ドラ};{·;};{Prinsdom Andorra;Andorra};{اها�هننندورا;ندورا};{Ksistwo Andory;Andora};{Principado de Andorra;Andorra};{няествондорра;ндорра};{Andorrské knieatstvo;Andorra};{Principado de Andorra;Andorra};{Kneevina Andora;Andora};{Furstendömet Andorra;Andorra};{Andorra Prensliği;Andorra};{امارا�ِ·انورا;انورا};{;}};[42.5;1.5];true;[FRA;ESP];468;;{{Andorran;Andorran};{Andorrane;Andorran}}
{United Arab Emirates;United Arab Emirates;{ara:{official:المارا� العربية المتدة;common:المارا�}}};[.ae;امارا�.];AE;784;ARE;UAE;true;officially-assigned;true;Asia and the Pacific Group;{AED:{name:United Arab Emirates dirham;symbol:د.}};{+9;[71]};[Abu Dhabi];[AE;UAE;Emirates];Asia;Western Asia;{ara:Arabic};{{المارا� العربية المتدة;المارا�};{Emirelezhio Arab Unanet;Emirelezhio Arab Unanet};{Spojené arabské emiráty;Spojené arabské emiráty};{Vereinigte Arabische Emirate;Vereinigte Arabische Emirate};{Araabia Ühendemiraadid;Araabia Ühendemiraadid};{Yhdistyneet arabiemiirikunnat;Arabiemiraatit};{Émirats arabes unis;Émirats arabes unis};{Ujedinjeni Arapski Emirati;Ujedinjeni Arapski Emirati};{Egyesült Arab Emírségek;Egyesült Arab Emírségek};{Emirati Arabi Uniti;Emirati Arabi Uniti};{;UAE};{·;};{Verenigde Arabische Emiraten;Verenigde Arabische Emiraten};{امارا� متدهرب;امارا�};{Zjednoczone Emiraty Arabskie;Zjednoczone Emiraty Arabskie};{Emiradosrabes Unidos;Emiradosrabes Unidos};{единенныераскиемираты;единнныераскиемираты};{Spojené arabské emiráty;Spojené arabské emiráty};{Emiratosrabes Unidos;Emiratosrabes Unidos};{Ujedinjeni Arapski Emirati;Ujedinjeni Arapski Emirati};{Förenade Arabemiraten;Förenade Arabemiraten};{Birleşik Arap Emirlikleri;Birleşik Arap Emirlikleri};{متدرب·امارا�;متدرب·امارا�};{��;��}};[24;54];false;[OMN;SAU];83600;;{{Emirati;Emirati};{Emirienne;Emirien}}
{Argentina;Argentine Republic;{grn:{official:Argentine Republic;common:Argentina};spa:{official:República Argentina;common:Argentina}}};[.ar];AR;032;ARG;ARG;true;officially-assigned;true;Latin American and Caribbean Group;{ARS:{name:Argentine peso;symbol:$}};{+5;[4]};[Buenos Aires];[AR;Argentine Republic;República Argentina];Americas;South America;{grn:Guaraní;spa:Spanish};{{مهورية الرنتين;الرنتين};{Republik Arc'hantina;Arc'hantina};{Argentinská republika;Argentina};{Argentinische Republik;Argentinien};{Argentina Vabariik;Argentina};{Argentiinan tasavalta;Argentiina};{République argentine;Argentine};{Argentinski Republika;Argentina};{Argentin Köztársaság;Argentína};{Repubblica Argentina;Argentina};{アル;アル};{·;};{Argentijnse Republiek;Argentinië};{مهوررانتن;رانتن};{Republika Argentyska;Argentyna};{República Argentina;Argentina};{рентинскаяесулика;рентина};{Argentínska republika;Argentína};{República Argentina;Argentina};{Republika Argentina;Argentina};{Republiken Argentina;Argentina};{Arjantin Cumhuriyeti;Arjantin};{مور·ارنا�ن;ارنا�ن};{;}};[-34;-64];false;[BOL;BRA;CHL;PRY;URY];2780400;;{{Argentine;Argentine};{Argentine;Argentin}}
{Armenia;Republic of Armenia;{hye:{official:·;common:}}};[.am];AM;051;ARM;ARM;true;officially-assigned;true;Eastern European Group;{AMD:{name:Armenian dram;symbol:}};{+3;[74]};[Yerevan];[AM;Hayastan;Republic of Armenia;·];Asia;Western Asia;{hye:Armenian};{{مهوريةرمينيا;رمينيا};{Republik Armenia;Armenia};{Arménská republika;Arménie};{Republik Armenien;Armenien};{Armeenia Vabariik;Armeenia};{Armenian tasavalta;Armenia};{République d'Arménie;Arménie};{Republika Armenija;Armenija};{rményország;rményország};{Repubblica di Armenia;Armenia};{アル;アル};{·;};{Republiek Armenië;Armenië};{مهور·ارمنستان;ارمنستان};{Republika Armenii;Armenia};{República da Arménia;Arménia};{есуликармения;рмения};{Arménska republika;Arménsko};{República de Armenia;Armenia};{Republika Jermenija;Jermenija};{Republiken Armenien;Armenien};{Ermenistan Cumhuriyeti;Ermenistan};{موررمنا;رمنا};{;}};[40;45];true;[AZE;GEO;IRN;TUR];29743;;{{Armenian;Armenian};{Arménienne;Arménien}}
{American Samoa;American Samoa;{eng:{official:American Samoa;common:American Samoa};smo:{official:Sāmoa Amelika;common:Sāmoa Amelika}}};[.as];AS;016;ASM;ASA;false;officially-assigned;false;;{USD:{name:United States dollar;symbol:$}};{+1;[684]};[Pago Pago];[AS;Amerika Sāmoa;Amelika Sāmoa;Sāmoa Amelika];Oceania;Polynesia;{eng:English;smo:Samoan};{{ساموا المريية;ساموا المريية};{Samoa Amerikan;Samoa Amerikan};{Americká Samoa;Americká Samoa};{Amerikanisch-Samoa;Amerikanisch-Samoa};{Ameerika Samoa;Ameerika Samoa};{Amerikan Samoa;Amerikan Samoa};{Samoa américaines;Samoa américaines};{američka Samoa;Američka Samoa};{Szamoa;Szamoa};{Samoa americane;Samoa Americane};{;};{��;��};{Amerikaans Samoa;Amerikaans Samoa};{سامومرا;سامومرا};{Samoa Amerykaskie;Samoa Amerykaskie};{Samoa americana;Samoa Americana};{американскоеамоа;мериканскоеамоа};{Americká Samoa;Americká Samoa};{Samoa Americana;Samoa Americana};{Američka Samoa;Američka Samoa};{Amerikanska Samoa;Amerikanska Samoa};{Amerikan Samoası;Amerikan Samoası};{امرمووا;امرمووا};{;}};[-14.33333333;-170];false;[];199;;{{American Samoan;American Samoan};{Samoane;Samoan}}
{Antarctica;Antarctica;{}};[.aq];AQ;010;ATA;;false;officially-assigned;false;;{};{;[]};[];[AQ];Antarctic;;{};{{نتارتيا;نتارتيا};{Antarktika;Antarktika};{Antarktida;Antarktida};{Antarktika;Antarktis};{Antarktika;Antarktika};{Etelämanner;Etelämanner};{Antarctique;Antarctique};{Antarktika;Antarktika};{Antarktisz;Antarktisz};{Antartide;Antartide};{��;��};{;};{Antarctica;Antarctica};{نوبان;نوبان};{Antarktyka;Antarktyka};{Antártica;Antártida};{нтарктида;нтарктида};{Antarktída;Antarktída};{Antártida;Antártida};{Antarktik;Antarktik};{Antarktis;Antarktis};{Antarktika;Antarktika};{انارا;انارا};{;}};[-90;0];false;[];14000000;;{{Antarctican;Antarctican};{Antarcticaine;Antarcticain}}
{French Southern and Antarctic Lands;Territory of the French Southern and Antarctic Lands;{fra:{official:Territoire des Terres australes et antarctiques françaises;common:Terres australes et antarctiques françaises}}};[.tf];TF;260;ATF;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+2;[62]};[Port-aux-Français];[TF;French Southern Territories];Antarctic;;{fra:French};{{ما�عا� واليم ما ورا� البار الرنسية;را�رنسيةنوبية ونتارتيية};{Tiriad Douaro Aostral hag Antarktikel Frañs;Douaro Aostral hag Antarktikel Frañs};{Teritorium Francouzská jiní a antarktickázemí;Francouzská jiní a antarktickázemí};{Gebiet der Französisch Süd- und Antarktisgebiete;Französische Süd- und Antarktisgebiete};{Prantsuse Lunaalad;Prantsuse Lunaalad};{Ranskan eteläiset ja antarktiset alueet;Ranskan eteläiset ja antarktiset alueet};{Territoire des Terres australes et antarctiques françaises;Terres australes et antarctiques françaises};{Teritoriju Francuski juni i antarktički teritoriji;Francuski juni i antarktički teritoriji};{Franciali·és antarktiszi területek;Franciali·és antarktiszi területek};{Territorio della australi e antartiche francesi Terre;Territori Francesi del Sud};{ラン��;ラン��};{;};{Grondgebied van de Franse Zuidelijke en Antarctische gebieden;Franse Gebieden in de zuidelijke Indische Oceaan};{سرمنهانوب ونوبانرانسه;سرمنهانوب ونوبانرانسه};{Francuskie Terytoria Południowe i Antarktyczne;Francuskie Terytoria Południowe i Antarktyczne};{Território do Sul e Antártica Francesa;Terras Austrais e Antárticas Francesas};{ерриторияранускиеныентарктиескиеемли;ранускиеныентарктиеские·территории};{Francúzske juné a antarktickézemia;Francúzske juné a antarktickézemia};{Territorio del Francés Tierras australes y antárticas;Tierras Australes y Antárticas Francesas};{Francuske june i antarktičke zemlje;Francuske june i antarktičke zemlje};{Franska syd- och Antarktisterritorierna;Franska södra territorierna};{Fransız Güney ve Antarktika Toprakları;Fransız Güney ve Antarktika 
Toprakları};{سرمنِنوبرانسس و·انار;سرمننوبرانسس و·انارا};{;}};[-49.25;69.167];false;[];7747;;{{French;French};{Française;Français}}
{Antigua and Barbuda;Antigua and Barbuda;{eng:{official:Antigua and Barbuda;common:Antigua and Barbuda}}};[.ag];AG;028;ATG;ANT;true;officially-assigned;true;Latin American and Caribbean Group;{XCD:{name:Eastern Caribbean dollar;symbol:$}};{+1;[268]};[Saint John's];[AG];Americas;Caribbean;{eng:English};{{نتيوا وباربودا;نتيوا وباربودا};{Antigua ha Barbuda;Antigua ha Barbuda};{Antigua a Barbuda;Antigua a Barbuda};{Antigua und Barbuda;Antigua und Barbuda};{Antigua ja Barbuda;Antigua ja Barbuda};{Antigua ja Barbuda;Antigua ja Barbuda};{Antigua -et-Barbuda;Antigua-et-Barbuda};{Antigva i Barbuda;Antigva i Barbuda};{Antigua·és Barbuda;Antigua·és Barbuda};{Antigua e Barbuda;Antigua e Barbuda};{ティー�ー�;ティー�ー�};{;};{Antigua en Barbuda;Antigua en Barbuda};{نتوا واربودا;نتوا واربودا};{Antigua i Barbuda;Antigua i Barbuda};{Antigua e Barbuda;Antígua e Barbuda};{нтиуааруда;нтиуааруда};{Antigua a Barbuda;Antigua a Barbuda};{Antigua y Barbuda;Antigua y Barbuda};{Antigva i Barbuda;Antigva i Barbuda};{Antigua och Barbuda;Antigua och Barbuda};{Antigua ve Barbuda;Antigua ve Barbuda};{انوا واربوا;انوا واربوا};{;}};[17.05;-61.8];false;[];442;;{{Antiguan, Barbudan;Antiguan, Barbudan};{Antiguaise et barbudienne;Antiguaise et barbudien}}
{Australia;Commonwealth of Australia;{eng:{official:Commonwealth of Australia;common:Australia}}};[.au];AU;036;AUS;AUS;true;officially-assigned;true;Western European and Others Group;{AUD:{name:Australian dollar;symbol:$}};{+6;[1]};[Canberra];[AU];Oceania;Australia and New Zealand;{eng:English};{{ومونولستراليا;ستراليا};{Kenglad Aostralia;Aostralia};{Australské společenství;Austrálie};{Commonwealth Australien;Australien};{Austraalia Ühendus;Austraalia};{Australian liittovaltio;Australia};{Australie;Australie};{Commonwealth of Australia;Australija};{Ausztrálllamszövetség;Ausztrália};{Commonwealth dell'Australia;Australia};{スト;スト};{;};{Gemenebest van Australië;Australië};{لمرومسود·ا�ترالا;ا�ترالا};{Zwizek Australijski;Australia};{Comunidade da Austrália;Austrália};{о�руествовстралии;встралия};{Austrálsky zväz;Austrália};{Mancomunidad de Australia;Australia};{Komonvelt Australija;Australija};{Australiska statsförbundet;Australien};{Avustralya Federal Devleti;Avustralya};{دولتِ مترسرلا;سرلا};{;}};[-27;133];false;[];7692024;;{{Australian;Australian};{Australienne;Australien}}
{Austria;Republic of Austria;{bar:{official:Republik Österreich;common:sterreich}}};[.at];AT;040;AUT;AUT;true;officially-assigned;true;Western European and Others Group;{EUR:{name:Euro;symbol:}};{+4;[3]};[Vienna];[AT;Osterreich;Oesterreich];Europe;Central Europe;{bar:Austro-Bavarian German};{{مهورية النمسا;النمسا};{Republik Aostria;Aostria};{Rakouská republika;Rakousko};{Republik Österreich;sterreich};{Austria Vabariik;Austria};{Itävallan tasavalta;Itävalta};{République d'Autriche;Autriche};{Republika Austrija;Austrija};{Ausztria;Ausztria};{Repubblica d'Austria;Austria};{スト;スト};{·;};{Republiek Oostenrijk;Oostenrijk};{مهور·ا�ر;ا�ر};{Republika Austrii;Austria};{República daustria;ustria};{встрискаяесулика;встрия};{Rakúska republika;Rakúsko};{República de Austria;Austria};{Republika Austrija;Austrija};{Republiken Österrike;sterrike};{Avusturya Cumhuriyeti;Avusturya};{مورسرا;سرا};{;}};[47.33333333;13.33333333];true;[CZE;DEU;HUN;ITA;LIE;SVK;SVN;CHE];83871;;{{Austrian;Austrian};{Autrichienne;Autrichien}}
{Azerbaijan;Republic of Azerbaijan;{aze:{official:Azrbaycan Respublikası;common:Azrbaycan};rus:{official:ераданскаяесулика;common:ерадан}}};[.az];AZ;031;AZE;AZE;true;officially-assigned;true;Eastern European Group;{AZN:{name:Azerbaijani manat;symbol:}};{+9;[94]};[Baku];[AZ;Republic of Azerbaijan;Azrbaycan Respublikası];Asia;Western Asia;{aze:Azerbaijani;rus:Russian};{{مهوريةربيان;ربيان};{Republik Azerbaidjan;Azerbaidjan};{zerbájdánská republika;zerbájdán};{Republik Aserbaidschan;Aserbaidschan};{Aserbaidaani Vabariik;Aserbaidaan};{Azerbaidzanin tasavalta;Azerbaidzan};{République d'Azerbaïdjan;Azerbaïdjan};{Republika Azerbajdan;Azerbajdan};{Azerbajdzsán;Azerbajdzsán};{Repubblica dell'Azerbaigian;Azerbaijan};{;};{·;};{Republiek Azerbeidzjan;Azerbeidzjan};{مهوررباان;مهوررباان};{Republika Azerbejdanu;Azerbejdan};{República do Azerbaijão;Azerbeijão};{ераданскаяесулика;ерадан};{Azerbajanská republika;Azerbajan};{República de Azerbaiyán;Azerbaiyán};{Republika Azerbejdan;Azerbejdan};{Republiken Azerbajdzjan;Azerbajdzjan};{Azerbaycan Cumhuriyeti;Azerbaycan};{مورربا�ان;ربا�ان};{;}};[40.5;47.5];true;[ARM;GEO;IRN;RUS;TUR];86600;;{{Azerbaijani;Azerbaijani};{Azerbaïdjanaise;Azerbaïdjanais}}
{Burundi;Republic of Burundi;{fra:{official:République du Burundi;common:Burundi};run:{official:Republika y'Uburundi ;common:Uburundi}}};[.bi];BI;108;BDI;BDI;true;officially-assigned;true;African Group;{BIF:{name:Burundian franc;symbol:Fr}};{+2;[57]};[Gitega];[BI;Republic of Burundi;Republika y'Uburundi;République du Burundi];Africa;Eastern Africa;{fra:French;run:Kirundi};{{مهوريةوروندي;بوروندي};{Republik Burundi;Burundi};{Burundská republika;Burundi};{Republik Burundi;Burundi};{Burundi Vabariik;Burundi};{Burundin tasavalta;Burundi};{République du Burundi;Burundi};{Burundi;Burundi};{Burundi;Burundi};{Repubblica del Burundi;Burundi};{ンジ;ンジ};{;};{Republiek Burundi;Burundi};{مهوروروند;بوروند};{Republika Burundi;Burundi};{República do Burundi;Burundi};{есуликаурунди;урунди};{Burundská republika;Burundi};{República de Burundi;Burundi};{Republika Burundi;Burundi};{Republiken Burundi;Burundi};{Burundi Cumhuriyeti;Burundi};{موررون;برون};{;}};[-3.5;30];true;[COD;RWA;TZA];27834;;{{Burundian;Burundian};{Burundaise;Burundais}}
{Belgium;Kingdom of Belgium;{deu:{official:Königreich Belgien;common:Belgien};fra:{official:Royaume de Belgique;common:Belgique};nld:{official:Koninkrijk België;common:België}}};[.be];BE;056;BEL;BEL;true;officially-assigned;true;Western European and Others Group;{EUR:{name:Euro;symbol:}};{+3;[2]};[Brussels];[BE;België;Belgie;Belgien;Belgique;Kingdom of Belgium;Koninkrijk België;Royaume de Belgique;Königreich Belgien];Europe;Western Europe;{deu:German;fra:French;nld:Dutch};{{مملةليا;بليا};{Rouantelezh Belgia;Belgia};{Belgické království;Belgie};{Königreich Belgien;Belgien};{Belgia Kuningriik;Belgia};{Belgian kuningaskunta;Belgia};{Royaume de Belgique;Belgique};{Kraljevina Belgija;Belgija};{Belga Királyság;Belgium};{Regno del Belgio;Belgio};{;};{;};{Koninkrijk België;België};{ا�اهل;بل};{Królestwo Belgii;Belgia};{Reino da Bélgica;Bélgica};{оро�евствоельия;ельия};{Belgické kráovstvo;Belgicko};{Reino de Bélgica;Bélgica};{Kraljevina Belgija;Belgija};{Konungariket Belgien;Belgien};{Belçika Krallığı;Belçika};{مملتِلم;بلم};{;}};[50.83333333;4];false;[FRA;DEU;LUX;NLD];30528;;{{Belgian;Belgian};{Belge;Belge}}
{Benin;Republic of Benin;{fra:{official:République du Bénin;common:Bénin}}};[.bj];BJ;204;BEN;BEN;true;officially-assigned;true;African Group;{XOF:{name:West African CFA franc;symbol:Fr}};{+2;[29]};[Porto-Novo];[BJ;Republic of Benin;République du Bénin];Africa;Western Africa;{fra:French};{{مهوريةنين;بنين};{Republik Benin;Benin};{Beninská republika;Benin};{Republik Benin;Benin};{Benini Vabariik;Benin};{Beninin tasavalta;Benin};{République du Bénin;Bénin};{Republika Benin;Benin};{Benini Köztársaság;Benin};{Repubblica del Benin;Benin};{;};{·;};{Republiek Benin;Benin};{مهورنن;بنن};{Benin;Benin};{República do Benin;Benin};{есуликаенин;енин};{Beninská republika;Benin};{República de Benin;Benín};{Republika Benin;Benin};{Republiken Benin;Benin};{Benin Cumhuriyeti;Benin};{مورنن;بنن};{;}};[9.5;2.25];false;[BFA;NER;NGA;TGO];112622;;{{Beninese;Beninese};{Béninoise;Béninois}}
{Burkina Faso;Burkina Faso;{fra:{official:République du Burkina;common:Burkina Faso}}};[.bf];BF;854;BFA;BUR;true;officially-assigned;true;African Group;{XOF:{name:West African CFA franc;symbol:Fr}};{+2;[26]};[Ouagadougou];[BF];Africa;Western Africa;{fra:French};{{بوريناا�و;بوريناا�و};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{République du Burkina;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina};{Burkina Faso;Burkina Faso};{ファ;ファ};{;};{Burkina Faso;Burkina Faso};{بورناا�و;بورناا�و};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{уркина -асо;уркина-асо};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{برناا�و;برناا�و};{;}};[13;-2];true;[BEN;CIV;GHA;MLI;NER;TGO];272967;;{{Burkinabe;Burkinabe};{Burkinabée;Burkinabé}}
{Bangladesh;People's Republic of Bangladesh;{ben:{official:·;common:}}};[.bd];BD;050;BGD;BAN;true;officially-assigned;true;Asia and the Pacific Group;{BDT:{name:Bangladeshi taka;symbol:}};{+8;[80]};[Dhaka];[BD;People's Republic of Bangladesh;Gônôprôjatôntri Bangladesh];Asia;Southern Asia;{ben:Bengali};{{مهوريةنلا�ي العبية;بنلا�ي};{Republik pobl Bangladesh;Bangladesh};{Bangladéšská lidová republika;Bangladéš};{Volksrepublik Bangladesch;Bangladesch};{Bangladeshi Rahvavabariik;Bangladesh};{Bangladeshin kansantasavalta;Bangladesh};{Lapublique populaire du Bangladesh;Bangladesh};{Narodna Republika Bangladeš;Bangladeš};{Banglades;Banglades};{Repubblica popolare del Bangladesh;Bangladesh};{;};{·;};{Volksrepubliek Bangladesh;Bangladesh};{مهورلنلا�;بنلا�};{Ludowa Republika Bangladeszu;Bangladesz};{República Popular do Bangladesh;Bangladesh};{аро�наяесуликаанладе;анладе};{Bangladéšskaudová republika;Bangladéš};{República Popular de Bangladesh;Bangladesh};{Narodna Republika Bangladeš;Bangladeš};{Folkrepubliken Bangladesh;Bangladesh};{Bangladeş Halk Cumhuriyeti;Bangladeş};{عواممورنل;بنل};{;}};[24;90];false;[MMR;IND];147570;;{{Bangladeshi;Bangladeshi};{Bangladaise;Bangladais}}
{Bulgaria;Republic of Bulgaria;{bul:{official:еуликалария;common:лария}}};[.bg];BG;100;BGR;BUL;true;officially-assigned;true;Eastern European Group;{BGN:{name:Bulgarian lev;symbol:лв}};{+3;[59]};[Sofia];[BG;Republic of Bulgaria;еуликалария];Europe;Southeast Europe;{bul:Bulgarian};{{مهوريةلاريا;بلاريا};{Republik Bulgaria;Bulgaria};{Bulharská republika;Bulharsko};{Republik Bulgarien;Bulgarien};{Bulgaaria Vabariik;Bulgaaria};{Bulgarian tasavalta;Bulgaria};{République de Bulgarie;Bulgarie};{Republika Bugarska;Bugarska};{Bolgár Köztársaság;Bulgária};{Repubblica di Bulgaria;Bulgaria};{;};{·;};{Republiek Bulgarije;Bulgarije};{مهورلارستان;بلارستان};{Republika Bułgarii;Bułgaria};{República da Bulgária;Bulgária};{есуликао�ария;о�ария};{Bulharská republika;Bulharsko};{República de Bulgaria;Bulgaria};{Republika Bugarska;Bugarska};{Republiken Bulgarien;Bulgarien};{Bulgaristan Cumhuriyeti;Bulgaristan};{مورلار;بلار};{;}};[43;25];false;[GRC;MKD;ROU;SRB;TUR];110879;;{{Bulgarian;Bulgarian};{Bulgare;Bulgare}}
{Bahrain;Kingdom of Bahrain;{ara:{official:مملة البرين;common:البرين}}};[.bh];BH;048;BHR;BRN;true;officially-assigned;true;Asia and the Pacific Group;{BHD:{name:Bahraini dinar;symbol:.د.ب}};{+9;[73]};[Manama];[BH;Kingdom of Bahrain;Mamlakat al-Barayn];Asia;Western Asia;{ara:Arabic};{{مملة البرين;البرين};{Rouantelezh Bahrein;Bahrein};{Království Bahrajn;Bahrajn};{Königreich Bahrain;Bahrain};{Bahreini Kuningriik;Bahrein};{Bahrainin kuningaskunta;Bahrain};{Royaume de Bahreïn;Bahreïn};{Kraljevina Bahrein;Bahrein};{Bahreini Királyság;Bahrein};{Regno del Bahrain;Bahrein};{ー�ーン;ー�ーン};{;};{Koninkrijk Bahrein;Bahrein};{ا�اهرن;برن};{Królestwo Bahrajnu;Bahrajn};{Reino do Bahrein;Bahrein};{оро�евствоарен;арен};{Bahrajnské kráovstvo;Bahrajn};{Reino de Bahrein;Bahrein};{Kraljevina Bahrein;Bahrein};{Konungariket Bahrain;Bahrain};{Bahreyn Krallığı;Bahreyn};{مملتِرن;برن};{;}};[26;50.55];false;[];765;;{{Bahraini;Bahraini};{Bahreïnienne;Bahreïnien}}
... (truncated)
large_non_uniform_nested_mixed.json — Original: 2402 chars — Tokenizer: gpt2 (openai-community/gpt2)
Format | Chars | Tokens | chars_og/tok | enc_chars/tok
JSON (pretty) | 2,402 | 1,292 | 1.9 | 1.9
JSON (min) | 1,500 | 446 | 5.4 | 3.4
CSV | N/A
TSV | N/A
YAML | 1,573 | 661 | 3.6 | 2.4
TOON | 1,766 | 841 | 2.9 | 2.1
TSON | 1,275 | 525 | 4.6 | 2.4
minemizer | 1,203 | 383 | 6.3 | 3.1
minemizer (compact) | 1,072 | 409 | 5.9 | 2.6
JSON (pretty)
chars: 2,402 tokens: 1,292 chars_og/tok: 1.9 enc_chars/tok: 1.9
[
· {
··· "id": 1,
··· "name": "Alice",
··· "work": {
····· "title": "Senior Engineer",
····· "years": 5,
····· "remote": true,
····· "team": "Platform"
··· },
··· "contact": {
····· "email": "alice@co.com"
··· }
· },
· {
··· "id": 2,
··· "profile": {
····· "age": 28,
····· "city": "NYC",
····· "verified": true
··· },
··· "status": "active",
··· "permissions": {
····· "admin": false,
····· "editor": true
... (truncated)
JSON (min)
chars: 1,500 tokens: 446 chars_og/tok: 5.4 enc_chars/tok: 3.4
[{"id":1,"name":"Alice","work":{"title":"Senior Engineer","years":5,"remote":true,"team":"Platform"},"contact":{"email":"alice@co.com"}},{"id":2,"profile":{"age":28,"city":"NYC","verified":true},"status":"active","permissions":{"admin":false,"editor":true}},{"id":3,"name":"Charlie","contact":{"email":"c@example.com","preferred":"email","phone":"555-0103"},"metadata":{"created":"2019-06-10"}},{"id":4,"user":{"username":"diana","role":"admin","level":5},"metadata":{"created":"2020-09-01","updated":"2024-01-20"},"settings":{"theme":"dark"}},{"id":5,"employee":{"name":"Eve Adams","department":"Sales"},"performance":{"score":85,"reviews":3},"contact":{"email":"eve@co.com","slack":"@eve"}},{"id":6,"name":"Frank","work":{"title":"Product Manager","years":8,"remote":false,"team":"Growth"},"contact":{"email":"frank@co.com","phone":"555-0106"}},{"id":7,"profile":{"age":35,"city":"LA","verified":false},"status":"inactive","permissions":{"admin":true,"editor":false},"metadata":{"created":"2018-03-15"}},{"id":8,"name":"Grace","contact":{"email":"grace@example.org","preferred":"slack","slack":"@grace"},"settings":{"theme":"light","notifications":true}},{"id":9,"user":{"username":"henry","role":"viewer","level":2},"employee":{"name":"Henry Wilson","department":"Marketing"},"performance":{"score":72,"reviews":5}},{"id":10,"name":"Iris","work":{"title":"Designer","years":3,"remote":true,"team":"Creative"},"profile":{"age":26,"city":"Austin","verified":true},"contact":{"email":"iris@co.com"}}]
CSV: N/A
TSV: N/A
YAML
chars: 1,573 tokens: 661 chars_og/tok: 3.6 enc_chars/tok: 2.4
- contact:
··· email: alice@co.com
· id: 1
· name: Alice
· work:
··· remote: true
··· team: Platform
··· title: Senior Engineer
··· years: 5
- id: 2
· permissions:
··· admin: false
··· editor: true
· profile:
··· age: 28
··· city: NYC
··· verified: true
· status: active
- contact:
··· email: c@example.com
··· phone: 555-0103
··· preferred: email
· id: 3
· metadata:
··· created: '2019-06-10'
... (truncated)
TOON
chars: 1,766 tokens: 841 chars_og/tok: 2.9 enc_chars/tok: 2.1
[10]:
· - id: 1
··· name: Alice
··· work:
····· title: Senior Engineer
····· years: 5
····· remote: true
····· team: Platform
··· contact:
····· email: alice@co.com
· - id: 2
··· profile:
····· age: 28
····· city: NYC
····· verified: true
··· status: active
··· permissions:
····· admin: false
····· editor: true
· - id: 3
··· name: Charlie
··· contact:
····· email: c@example.com
····· preferred: email
····· phone: 555-0103
... (truncated)
TSON
chars: 1,275 tokens: 525 chars_og/tok: 4.6 enc_chars/tok: 2.4
[{@id,name,work,contact|1,Alice,{@title,years,remote,team|"Senior Engineer",5,true,Platform},{@email|"alice@co.com"}},{@id,profile,status,permissions|2,{@age,city,verified|28,NYC,true},active,{@admin,editor|false,true}},{@id,name,contact,metadata|3,Charlie,{@email,preferred,phone|"c@example.com",email,555-0103},{@created|2019-06-10}},{@id,user,metadata,settings|4,{@username,role,level|diana,admin,5},{@created,updated|2020-09-01,2024-01-20},{@theme|dark}},{@id,employee,performance,contact|5,{@name,department|"Eve Adams",Sales},{@score,reviews|85,3},{@email,slack|"eve@co.com","@eve"}},{@id,name,work,contact|6,Frank,{@title,years,remote,team|"Product Manager",8,false,Growth},{@email,phone|"frank@co.com",555-0106}},{@id,profile,status,permissions,metadata|7,{@age,city,verified|35,LA,false},inactive,{@admin,editor|true,false},{@created|2018-03-15}},{@id,name,contact,settings|8,Grace,{@email,preferred,slack|"grace@example.org",slack,"@grace"},{@theme,notifications|light,true}},{@id,user,employee,performance|9,{@username,role,level|henry,viewer,2},{@name,department|"Henry Wilson",Marketing},{@score,reviews|72,5}},{@id,name,work,profile,contact|10,Iris,{@title,years,remote,team|Designer,3,true,Creative},{@age,city,verified|26,Austin,true},{@email|"iris@co.com"}}]
minemizer
chars: 1,203 tokens: 383 chars_og/tok: 6.3 enc_chars/tok: 3.1
id; name; contact{ email; ...}
1; Alice;{ alice@co.com}; work{ title: Senior Engineer; years: 5; remote:true; team: Platform}
2;;; profile{ age: 28; city: NYC; verified:true}; status: active; permissions{ admin:false; editor:true}
3; Charlie;{ c@example.com; preferred: email; phone: 555-0103}; metadata{ created: 2019-06-10}
4;;; user{ username: diana; role: admin; level: 5}; metadata{ created: 2020-09-01; updated: 2024-01-20}; settings{ theme: dark}
5;;{ eve@co.com; slack: @eve}; employee{ name: Eve Adams; department: Sales}; performance{ score: 85; reviews: 3}
6; Frank;{ frank@co.com; phone: 555-0106}; work{ title: Product Manager; years: 8; remote:false; team: Growth}
7;;; profile{ age: 35; city: LA; verified:false}; status: inactive; permissions{ admin:true; editor:false}; metadata{ created: 2018-03-15}
8; Grace;{ grace@example.org; preferred: slack; slack: @grace}; settings{ theme: light; notifications:true}
9;;; user{ username: henry; role: viewer; level: 2}; employee{ name: Henry Wilson; department: Marketing}; performance{ score: 72; reviews: 5}
10; Iris;{ iris@co.com}; work{ title: Designer; years: 3; remote:true; team: Creative}; profile{ age: 26; city: Austin; verified:true}
minemizer (compact)
chars: 1,072 tokens: 409 chars_og/tok: 5.9 enc_chars/tok: 2.6
id;name;contact{email;...}
1;Alice;{alice@co.com};work{title:Senior Engineer;years:5;remote:true;team:Platform}
2;;;profile{age:28;city:NYC;verified:true};status:active;permissions{admin:false;editor:true}
3;Charlie;{c@example.com;preferred:email;phone:555-0103};metadata{created:2019-06-10}
4;;;user{username:diana;role:admin;level:5};metadata{created:2020-09-01;updated:2024-01-20};settings{theme:dark}
5;;{eve@co.com;slack:@eve};employee{name:Eve Adams;department:Sales};performance{score:85;reviews:3}
6;Frank;{frank@co.com;phone:555-0106};work{title:Product Manager;years:8;remote:false;team:Growth}
7;;;profile{age:35;city:LA;verified:false};status:inactive;permissions{admin:true;editor:false};metadata{created:2018-03-15}
8;Grace;{grace@example.org;preferred:slack;slack:@grace};settings{theme:light;notifications:true}
9;;;user{username:henry;role:viewer;level:2};employee{name:Henry Wilson;department:Marketing};performance{score:72;reviews:5}
10;Iris;{iris@co.com};work{title:Designer;years:3;remote:true;team:Creative};profile{age:26;city:Austin;verified:true}
large_non_uniform_nested_numerical.json — Original: 2947 chars — Tokenizer: gpt2 (openai-community/gpt2)
Format | Chars | Tokens | chars_og/tok | enc_chars/tok
JSON (pretty) | 2,947 | 1,718 | 1.7 | 1.7
JSON (min) | 1,873 | 755 | 3.9 | 2.5
CSV | N/A
TSV | N/A
YAML | 2,085 | 1,033 | 2.9 | 2.0
TOON | 2,318 | 1,249 | 2.4 | 1.9
TSON | 1,642 | 823 | 3.6 | 2.0
minemizer | 1,534 | 632 | 4.7 | 2.4
minemizer (compact) | 1,361 | 676 | 4.4 | 2.0
JSON (pretty)
chars: 2,947 tokens: 1,718 chars_og/tok: 1.7 enc_chars/tok: 1.7
[
· {
··· "id": 1,
··· "metrics": {
····· "views": 15420,
····· "clicks": 842,
····· "ctr": 0.0546,
····· "bounce_rate": 0.32
··· },
··· "revenue": {
····· "amount": 12499.99,
····· "currency_rate": 1.0
··· },
··· "timestamp": "2024-01-15T09:30:00Z"
· },
· {
··· "id": 2,
··· "metrics": {
····· "views": 8923,
····· "clicks": 156,
····· "ctr": 0.0175,
····· "bounce_rate": 0.67
··· },
··· "stats": {
····· "avg_time": 45.7,
... (truncated)
JSON (min)
chars: 1,873 tokens: 755 chars_og/tok: 3.9 enc_chars/tok: 2.5
[{"id":1,"metrics":{"views":15420,"clicks":842,"ctr":0.0546,"bounce_rate":0.32},"revenue":{"amount":12499.99,"currency_rate":1.0},"timestamp":"2024-01-15T09:30:00Z"},{"id":2,"metrics":{"views":8923,"clicks":156,"ctr":0.0175,"bounce_rate":0.67},"stats":{"avg_time":45.7,"pages_per_session":2.3,"return_rate":0.15},"timestamp":"2024-01-16T14:22:33Z"},{"id":3,"revenue":{"amount":8750.5,"tax":700.04,"net":8050.46,"currency_rate":0.92},"inventory":{"count":342,"reserved":28,"available":314}},{"id":4,"metrics":{"views":52100,"clicks":3891,"ctr":0.0747,"bounce_rate":0.21},"performance":{"latency_ms":127.5,"uptime":0.9987,"errors":3},"timestamp":"2024-01-17T08:00:00Z"},{"id":5,"stats":{"avg_time":128.9,"pages_per_session":5.7,"return_rate":0.42},"scores":{"quality":94,"relevance":87,"engagement":0.78},"dates":{"start":"2023-06-01","end":"2024-01-31"}},{"id":6,"inventory":{"count":1205,"reserved":89,"available":1116,"reorder_point":200},"pricing":{"cost":24.99,"markup":0.35,"price":33.74},"timestamp":"2024-01-18T11:45:12Z"},{"id":7,"metrics":{"views":3156,"clicks":98,"ctr":0.031,"bounce_rate":0.55},"revenue":{"amount":2150.0,"tax":172.0,"net":1978.0},"performance":{"latency_ms":89.2,"uptime":0.9995,"errors":0}},{"id":8,"scores":{"quality":78,"relevance":92,"engagement":0.65,"nps":45},"dates":{"start":"2022-11-15","end":"2024-02-28","renewal":"2024-03-01"},"budget":{"allocated":50000,"spent":42350.75,"remaining":7649.25}},{"id":9,"pricing":{"cost":149.99,"markup":0.28,"price":191.99,"discount":0.1},"inventory":{"count":56,"reserved":12,"available":44},"timestamp":"2024-01-19T16:30:45Z"},{"id":10,"metrics":{"views":128750,"clicks":9823,"ctr":0.0763,"bounce_rate":0.18},"stats":{"avg_time":312.4,"pages_per_session":8.2,"return_rate":0.58},"budget":{"allocated":125000,"spent":98420.33,"remaining":26579.67},"dates":{"start":"2023-01-01","end":"2024-12-31"}}]
CSV: N/A
TSV: N/A
YAML
chars: 2,085 tokens: 1,033 chars_og/tok: 2.9 enc_chars/tok: 2.0
- id: 1
· metrics:
··· bounce_rate: 0.32
··· clicks: 842
··· ctr: 0.0546
··· views: 15420
· revenue:
··· amount: 12499.99
··· currency_rate: 1.0
· timestamp: '2024-01-15T09:30:00Z'
- id: 2
· metrics:
··· bounce_rate: 0.67
··· clicks: 156
··· ctr: 0.0175
··· views: 8923
· stats:
··· avg_time: 45.7
··· pages_per_session: 2.3
··· return_rate: 0.15
· timestamp: '2024-01-16T14:22:33Z'
- id: 3
· inventory:
··· available: 314
··· count: 342
... (truncated)
TOON
chars: 2,318 tokens: 1,249 chars_og/tok: 2.4 enc_chars/tok: 1.9
[10]:
· - id: 1
··· metrics:
····· views: 15420
····· clicks: 842
····· ctr: 0.0546
····· bounce_rate: 0.32
··· revenue:
····· amount: 12499.99
····· currency_rate: 1.0
··· timestamp: "2024-01-15T09:30:00Z"
· - id: 2
··· metrics:
····· views: 8923
····· clicks: 156
····· ctr: 0.0175
····· bounce_rate: 0.67
··· stats:
····· avg_time: 45.7
····· pages_per_session: 2.3
····· return_rate: 0.15
··· timestamp: "2024-01-16T14:22:33Z"
· - id: 3
··· revenue:
····· amount: 8750.5
... (truncated)
TSON
chars: 1,642 tokens: 823 chars_og/tok: 3.6 enc_chars/tok: 2.0
[{@id,metrics,revenue,timestamp|1,{@views,clicks,ctr,bounce_rate|15420,842,0.0546,0.32},{@amount,currency_rate|12499.99,1.0},2024-01-15T09:30:00Z},{@id,metrics,stats,timestamp|2,{@views,clicks,ctr,bounce_rate|8923,156,0.0175,0.67},{@avg_time,pages_per_session,return_rate|45.7,2.3,0.15},2024-01-16T14:22:33Z},{@id,revenue,inventory|3,{@amount,tax,net,currency_rate|8750.5,700.04,8050.46,0.92},{@count,reserved,available|342,28,314}},{@id,metrics,performance,timestamp|4,{@views,clicks,ctr,bounce_rate|52100,3891,0.0747,0.21},{@latency_ms,uptime,errors|127.5,0.9987,3},2024-01-17T08:00:00Z},{@id,stats,scores,dates|5,{@avg_time,pages_per_session,return_rate|128.9,5.7,0.42},{@quality,relevance,engagement|94,87,0.78},{@start,end|2023-06-01,2024-01-31}},{@id,inventory,pricing,timestamp|6,{@count,reserved,available,reorder_point|1205,89,1116,200},{@cost,markup,price|24.99,0.35,33.74},2024-01-18T11:45:12Z},{@id,metrics,revenue,performance|7,{@views,clicks,ctr,bounce_rate|3156,98,0.031,0.55},{@amount,tax,net|2150.0,172.0,1978.0},{@latency_ms,uptime,errors|89.2,0.9995,0}},{@id,scores,dates,budget|8,{@quality,relevance,engagement,nps|78,92,0.65,45},{@start,end,renewal|2022-11-15,2024-02-28,2024-03-01},{@allocated,spent,remaining|50000,42350.75,7649.25}},{@id,pricing,inventory,timestamp|9,{@cost,markup,price,discount|149.99,0.28,191.99,0.1},{@count,reserved,available|56,12,44},2024-01-19T16:30:45Z},{@id,metrics,stats,budget,dates|10,{@views,clicks,ctr,bounce_rate|128750,9823,0.0763,0.18},{@avg_time,pages_per_session,return_rate|312.4,8.2,0.58},{@allocated,spent,remaining|125000,98420.33,26579.67},{@start,end|2023-01-01,2024-12-31}}]
minemizer
chars: 1,534 tokens: 632 chars_og/tok: 4.7 enc_chars/tok: 2.4
id; metrics{ views; clicks; ctr; bounce_rate}; timestamp
1;{ 15420; 842; 0.0546; 0.32}; 2024-01-15T09:30:00Z; revenue{ amount: 12499.99; currency_rate: 1.0}
2;{ 8923; 156; 0.0175; 0.67}; 2024-01-16T14:22:33Z; stats{ avg_time: 45.7; pages_per_session: 2.3; return_rate: 0.15}
3;;; revenue{ amount: 8750.5; tax: 700.04; net: 8050.46; currency_rate: 0.92}; inventory{ count: 342; reserved: 28; available: 314}
4;{ 52100; 3891; 0.0747; 0.21}; 2024-01-17T08:00:00Z; performance{ latency_ms: 127.5; uptime: 0.9987; errors: 3}
5;;; stats{ avg_time: 128.9; pages_per_session: 5.7; return_rate: 0.42}; scores{ quality: 94; relevance: 87; engagement: 0.78}; dates{ start: 2023-06-01; end: 2024-01-31}
6;; 2024-01-18T11:45:12Z; inventory{ count: 1205; reserved: 89; available: 1116; reorder_point: 200}; pricing{ cost: 24.99; markup: 0.35; price: 33.74}
7;{ 3156; 98; 0.031; 0.55};; revenue{ amount: 2150.0; tax: 172.0; net: 1978.0}; performance{ latency_ms: 89.2; uptime: 0.9995; errors: 0}
8;;; scores{ quality: 78; relevance: 92; engagement: 0.65; nps: 45}; dates{ start: 2022-11-15; end: 2024-02-28; renewal: 2024-03-01}; budget{ allocated: 50000; spent: 42350.75; remaining: 7649.25}
9;; 2024-01-19T16:30:45Z; pricing{ cost: 149.99; markup: 0.28; price: 191.99; discount: 0.1}; inventory{ count: 56; reserved: 12; available: 44}
10;{ 128750; 9823; 0.0763; 0.18};; stats{ avg_time: 312.4; pages_per_session: 8.2; return_rate: 0.58}; budget{ allocated: 125000; spent: 98420.33; remaining: 26579.67}; dates{ start: 2023-01-01; end: 2024-12-31}
minemizer (compact)
chars: 1,361 tokens: 676 chars_og/tok: 4.4 enc_chars/tok: 2.0
id;metrics{views;clicks;ctr;bounce_rate};timestamp
1;{15420;842;0.0546;0.32};2024-01-15T09:30:00Z;revenue{amount:12499.99;currency_rate:1.0}
2;{8923;156;0.0175;0.67};2024-01-16T14:22:33Z;stats{avg_time:45.7;pages_per_session:2.3;return_rate:0.15}
3;;;revenue{amount:8750.5;tax:700.04;net:8050.46;currency_rate:0.92};inventory{count:342;reserved:28;available:314}
4;{52100;3891;0.0747;0.21};2024-01-17T08:00:00Z;performance{latency_ms:127.5;uptime:0.9987;errors:3}
5;;;stats{avg_time:128.9;pages_per_session:5.7;return_rate:0.42};scores{quality:94;relevance:87;engagement:0.78};dates{start:2023-06-01;end:2024-01-31}
6;;2024-01-18T11:45:12Z;inventory{count:1205;reserved:89;available:1116;reorder_point:200};pricing{cost:24.99;markup:0.35;price:33.74}
7;{3156;98;0.031;0.55};;revenue{amount:2150.0;tax:172.0;net:1978.0};performance{latency_ms:89.2;uptime:0.9995;errors:0}
8;;;scores{quality:78;relevance:92;engagement:0.65;nps:45};dates{start:2022-11-15;end:2024-02-28;renewal:2024-03-01};budget{allocated:50000;spent:42350.75;remaining:7649.25}
9;;2024-01-19T16:30:45Z;pricing{cost:149.99;markup:0.28;price:191.99;discount:0.1};inventory{count:56;reserved:12;available:44}
10;{128750;9823;0.0763;0.18};;stats{avg_time:312.4;pages_per_session:8.2;return_rate:0.58};budget{allocated:125000;spent:98420.33;remaining:26579.67};dates{start:2023-01-01;end:2024-12-31}
large_non_uniform_nested_text.json — Original: 4214 chars — Tokenizer: gpt2 (openai-community/gpt2)
Format | Chars | Tokens | chars_og/tok | enc_chars/tok
JSON (pretty) | 4,214 | 1,498 | 2.8 | 2.8
JSON (min) | 3,359 | 658 | 6.4 | 5.1
CSV | N/A
TSV | N/A
YAML | 3,387 | 818 | 5.2 | 4.1
TOON | 3,534 | 974 | 4.3 | 3.6
TSON | 3,173 | 721 | 5.8 | 4.4
minemizer | 2,809 | 522 | 8.1 | 5.4
minemizer (compact) | 2,694 | 565 | 7.5 | 4.8
JSON (pretty)
chars: 4,214 tokens: 1,498 chars_og/tok: 2.8 enc_chars/tok: 2.8
[
· {
··· "id": 1,
··· "title": "Introduction to Machine Learning",
··· "author": {
····· "name": "Dr. Sarah Chen",
····· "affiliation": "Stanford University",
····· "department": "Computer Science"
··· },
··· "abstract": "A comprehensive overview of modern machine learning techniques and applications",
··· "tags": [
····· "AI",
····· "ML",
····· "deep learning"
··· ]
· },
· {
··· "id": 2,
··· "title": "Climate Change Impact Assessment",
··· "content": {
····· "summary": "Analysis of rising sea levels and temperature patterns",
····· "methodology": "longitudinal study with satellite imagery",
····· "conclusion": "significant acceleration observed since 2010"
··· },
··· "category": "Environmental Science"
... (truncated)
JSON (min)
chars: 3,359 tokens: 658 chars_og/tok: 6.4 enc_chars/tok: 5.1
[{"id":1,"title":"Introduction to Machine Learning","author":{"name":"Dr. Sarah Chen","affiliation":"Stanford University","department":"Computer Science"},"abstract":"A comprehensive overview of modern machine learning techniques and applications","tags":["AI","ML","deep learning"]},{"id":2,"title":"Climate Change Impact Assessment","content":{"summary":"Analysis of rising sea levels and temperature patterns","methodology":"longitudinal study with satellite imagery","conclusion":"significant acceleration observed since 2010"},"category":"Environmental Science"},{"id":3,"author":{"name":"Marcus Williams","affiliation":"MIT Media Lab","role":"Principal Researcher"},"publication":{"journal":"Nature Communications","volume":"fifteen","status":"peer-reviewed"},"keywords":"quantum computing, error correction, fault tolerance"},{"id":4,"title":"Urban Planning Strategies for Sustainable Cities","abstract":"Examining green infrastructure and mixed-use development patterns","content":{"summary":"Case studies from Copenhagen, Singapore, and Portland","methodology":"comparative analysis with community surveys","findings":"walkability correlates strongly with resident satisfaction"},"tags":["urban design","sustainability","planning"]},{"id":5,"publication":{"journal":"The Lancet","volume":"four hundred two","issue":"special edition","status":"published"},"content":{"summary":"Global health outcomes following pandemic response measures","conclusion":"early intervention strategies proved most effective"},"category":"Public Health"},{"id":6,"title":"Advances in Natural Language Processing","author":{"name":"Dr. 
James Rodriguez","affiliation":"Google Research","department":"Language Understanding"},"abstract":"Survey of transformer architectures and attention mechanisms in modern NLP systems","keywords":"transformers, attention, language models, BERT, GPT"},{"id":7,"content":{"summary":"Historical analysis of economic policy shifts in emerging markets","methodology":"archival research combined with econometric modeling","findings":"trade liberalization showed mixed results across regions","limitations":"data availability constraints for pre-1990 period"},"category":"Economics","tags":["policy","trade","development"]},{"id":8,"title":"Biodiversity Conservation in Tropical Rainforests","author":{"name":"Dr. Ana Costa","affiliation":"Brazilian Institute for Amazonian Research","role":"Lead Ecologist"},"publication":{"journal":"Conservation Biology","status":"under review"},"abstract":"Mapping species distribution patterns and identifying critical habitat corridors"},{"id":9,"title":"Behavioral Economics and Consumer Decision Making","content":{"summary":"Experimental studies on cognitive biases in purchasing behavior","methodology":"randomized controlled trials with eye-tracking technology","conclusion":"anchoring effects persist even with expert consumers"},"keywords":"behavioral economics, decision theory, consumer psychology","category":"Psychology"},{"id":10,"author":{"name":"Prof. Michael Thompson","affiliation":"Oxford University","department":"Engineering Science","role":"Department Chair"},"publication":{"journal":"Advanced Materials","volume":"thirty-six","status":"accepted"},"abstract":"Novel synthesis methods for high-performance ceramic composites","tags":["materials science","ceramics","nanotechnology"]}]
CSV: N/A
TSV: N/A
YAML
chars: 3,387 tokens: 818 chars_og/tok: 5.2 enc_chars/tok: 4.1
- abstract: A comprehensive overview of modern machine learning techniques and applications
· author:
··· affiliation: Stanford University
··· department: Computer Science
··· name: Dr. Sarah Chen
· id: 1
· tags:
· - AI
· - ML
· - deep learning
· title: Introduction to Machine Learning
- category: Environmental Science
· content:
··· conclusion: significant acceleration observed since 2010
··· methodology: longitudinal study with satellite imagery
··· summary: Analysis of rising sea levels and temperature patterns
· id: 2
· title: Climate Change Impact Assessment
- author:
··· affiliation: MIT Media Lab
··· name: Marcus Williams
··· role: Principal Researcher
· id: 3
· keywords: quantum computing, error correction, fault tolerance
· publication:
... (truncated)
TOON
chars: 3,534 tokens: 974 chars_og/tok: 4.3 enc_chars/tok: 3.6
[10]:
· - id: 1
··· title: Introduction to Machine Learning
··· author:
····· name: Dr. Sarah Chen
····· affiliation: Stanford University
····· department: Computer Science
··· abstract: A comprehensive overview of modern machine learning techniques and applications
··· tags[3]: AI,ML,deep learning
· - id: 2
··· title: Climate Change Impact Assessment
··· content:
····· summary: Analysis of rising sea levels and temperature patterns
····· methodology: longitudinal study with satellite imagery
····· conclusion: significant acceleration observed since 2010
··· category: Environmental Science
· - id: 3
··· author:
····· name: Marcus Williams
····· affiliation: MIT Media Lab
····· role: Principal Researcher
··· publication:
····· journal: Nature Communications
····· volume: fifteen
····· status: peer-reviewed
... (truncated)
TSON
chars: 3,173 tokens: 721 chars_og/tok: 5.8 enc_chars/tok: 4.4
[{@id,title,author,abstract,tags|1,"Introduction to Machine Learning",{@name,affiliation,department|"Dr. Sarah Chen","Stanford University","Computer Science"},"A comprehensive overview of modern machine learning techniques and applications",[AI,ML,"deep learning"]},{@id,title,content,category|2,"Climate Change Impact Assessment",{@summary,methodology,conclusion|"Analysis of rising sea levels and temperature patterns","longitudinal study with satellite imagery","significant acceleration observed since 2010"},"Environmental Science"},{@id,author,publication,keywords|3,{@name,affiliation,role|"Marcus Williams","MIT Media Lab","Principal Researcher"},{@journal,volume,status|"Nature Communications",fifteen,peer-reviewed},"quantum computing, error correction, fault tolerance"},{@id,title,abstract,content,tags|4,"Urban Planning Strategies for Sustainable Cities","Examining green infrastructure and mixed-use development patterns",{@summary,methodology,findings|"Case studies from Copenhagen, Singapore, and Portland","comparative analysis with community surveys","walkability correlates strongly with resident satisfaction"},["urban design",sustainability,planning]},{@id,publication,content,category|5,{@journal,volume,issue,status|"The Lancet","four hundred two","special edition",published},{@summary,conclusion|"Global health outcomes following pandemic response measures","early intervention strategies proved most effective"},"Public Health"},{@id,title,author,abstract,keywords|6,"Advances in Natural Language Processing",{@name,affiliation,department|"Dr. 
James Rodriguez","Google Research","Language Understanding"},"Survey of transformer architectures and attention mechanisms in modern NLP systems","transformers, attention, language models, BERT, GPT"},{@id,content,category,tags|7,{@summary,methodology,findings,limitations|"Historical analysis of economic policy shifts in emerging markets","archival research combined with econometric modeling","trade liberalization showed mixed results across regions","data availability constraints for pre-1990 period"},Economics,[policy,trade,development]},{@id,title,author,publication,abstract|8,"Biodiversity Conservation in Tropical Rainforests",{@name,affiliation,role|"Dr. Ana Costa","Brazilian Institute for Amazonian Research","Lead Ecologist"},{@journal,status|"Conservation Biology","under review"},"Mapping species distribution patterns and identifying critical habitat corridors"},{@id,title,content,keywords,category|9,"Behavioral Economics and Consumer Decision Making",{@summary,methodology,conclusion|"Experimental studies on cognitive biases in purchasing behavior","randomized controlled trials with eye-tracking technology","anchoring effects persist even with expert consumers"},"behavioral economics, decision theory, consumer psychology",Psychology},{@id,author,publication,abstract,tags|10,{@name,affiliation,department,role|"Prof. Michael Thompson","Oxford University","Engineering Science","Department Chair"},{@journal,volume,status|"Advanced Materials",thirty-six,accepted},"Novel synthesis methods for high-performance ceramic composites",["materials science",ceramics,nanotechnology]}]
minemizer
chars: 2,809 tokens: 522 chars_og/tok: 8.1 enc_chars/tok: 5.4
id; title; author{ name; affiliation; department; role}; abstract; content{ summary; methodology; conclusion; ...}
1; Introduction to Machine Learning;{ Dr. Sarah Chen; Stanford University; Computer Science;}; A comprehensive overview of modern machine learning techniques and applications;; tags[ AI; ML; deep learning]
2; Climate Change Impact Assessment;;;{ Analysis of rising sea levels and temperature patterns; longitudinal study with satellite imagery; significant acceleration observed since 2010}; category: Environmental Science
3;;{ Marcus Williams; MIT Media Lab;; Principal Researcher};;; publication{ journal: Nature Communications; volume: fifteen; status: peer-reviewed}; keywords: quantum computing, error correction, fault tolerance
4; Urban Planning Strategies for Sustainable Cities;; Examining green infrastructure and mixed-use development patterns;{ Case studies from Copenhagen, Singapore, and Portland; comparative analysis with community surveys;; findings: walkability correlates strongly with resident satisfaction}; tags[ urban design; sustainability; planning]
5;;;;{ Global health outcomes following pandemic response measures;; early intervention strategies proved most effective}; publication{ journal: The Lancet; volume: four hundred two; issue: special edition; status: published}; category: Public Health
6; Advances in Natural Language Processing;{ Dr. James Rodriguez; Google Research; Language Understanding;}; Survey of transformer architectures and attention mechanisms in modern NLP systems;; keywords: transformers, attention, language models, BERT, GPT
7;;;;{ Historical analysis of economic policy shifts in emerging markets; archival research combined with econometric modeling;; findings: trade liberalization showed mixed results across regions; limitations: data availability constraints for pre-1990 period}; category: Economics; tags[ policy; trade; development]
8; Biodiversity Conservation in Tropical Rainforests;{ Dr. Ana Costa; Brazilian Institute for Amazonian Research;; Lead Ecologist}; Mapping species distribution patterns and identifying critical habitat corridors;; publication{ journal: Conservation Biology; status: under review}
9; Behavioral Economics and Consumer Decision Making;;;{ Experimental studies on cognitive biases in purchasing behavior; randomized controlled trials with eye-tracking technology; anchoring effects persist even with expert consumers}; keywords: behavioral economics, decision theory, consumer psychology; category: Psychology
10;;{ Prof. Michael Thompson; Oxford University; Engineering Science; Department Chair}; Novel synthesis methods for high-performance ceramic composites;; publication{ journal: Advanced Materials; volume: thirty-six; status: accepted}; tags[ materials science; ceramics; nanotechnology]
minemizer (compact)
chars: 2,694 tokens: 565 chars_og/tok: 7.5 enc_chars/tok: 4.8
id;title;author{name;affiliation;department;role};abstract;content{summary;methodology;conclusion;...}
1;Introduction to Machine Learning;{Dr. Sarah Chen;Stanford University;Computer Science;};A comprehensive overview of modern machine learning techniques and applications;;tags[AI;ML;deep learning]
2;Climate Change Impact Assessment;;;{Analysis of rising sea levels and temperature patterns;longitudinal study with satellite imagery;significant acceleration observed since 2010};category:Environmental Science
3;;{Marcus Williams;MIT Media Lab;;Principal Researcher};;;publication{journal:Nature Communications;volume:fifteen;status:peer-reviewed};keywords:quantum computing, error correction, fault tolerance
4;Urban Planning Strategies for Sustainable Cities;;Examining green infrastructure and mixed-use development patterns;{Case studies from Copenhagen, Singapore, and Portland;comparative analysis with community surveys;;findings:walkability correlates strongly with resident satisfaction};tags[urban design;sustainability;planning]
5;;;;{Global health outcomes following pandemic response measures;;early intervention strategies proved most effective};publication{journal:The Lancet;volume:four hundred two;issue:special edition;status:published};category:Public Health
6;Advances in Natural Language Processing;{Dr. James Rodriguez;Google Research;Language Understanding;};Survey of transformer architectures and attention mechanisms in modern NLP systems;;keywords:transformers, attention, language models, BERT, GPT
7;;;;{Historical analysis of economic policy shifts in emerging markets;archival research combined with econometric modeling;;findings:trade liberalization showed mixed results across regions;limitations:data availability constraints for pre-1990 period};category:Economics;tags[policy;trade;development]
8;Biodiversity Conservation in Tropical Rainforests;{Dr. Ana Costa;Brazilian Institute for Amazonian Research;;Lead Ecologist};Mapping species distribution patterns and identifying critical habitat corridors;;publication{journal:Conservation Biology;status:under review}
9;Behavioral Economics and Consumer Decision Making;;;{Experimental studies on cognitive biases in purchasing behavior;randomized controlled trials with eye-tracking technology;anchoring effects persist even with expert consumers};keywords:behavioral economics, decision theory, consumer psychology;category:Psychology
10;;{Prof. Michael Thompson;Oxford University;Engineering Science;Department Chair};Novel synthesis methods for high-performance ceramic composites;;publication{journal:Advanced Materials;volume:thirty-six;status:accepted};tags[materials science;ceramics;nanotechnology]
mcp_tools_list.json — Original: 51663 chars — Tokenizer: gpt2 (openai-community/gpt2)
Format | Chars | Tokens | chars_og/tok | enc_chars/tok
JSON (pretty) | 51,663 | 27,574 | 1.9 | 1.9
JSON (min) | 30,724 | 6,840 | 7.6 | 4.5
CSV | N/A
TSV | N/A
YAML | 38,139 | 16,770 | 3.1 | 2.3
TOON | 38,376 | 17,296 | 3.0 | 2.2
TSON | 25,878 | 7,318 | 7.1 | 3.5
minemizer | 23,383 | 5,559 | 9.3 | 4.2
minemizer (compact) | 21,912 | 5,672 | 9.1 | 3.9
JSON (pretty)
chars: 51,663 tokens: 27,574 chars_og/tok: 1.9 enc_chars/tok: 1.9
[
· {
··· "inputSchema": {
····· "json": {
······· "properties": {
········· "body": {
··········· "description": "Comment content",
··········· "type": "string"
········· },
········· "issue_number": {
··········· "description": "Issue number to comment on",
··········· "type": "number"
········· },
········· "owner": {
··········· "description": "Repository owner",
··········· "type": "string"
········· },
········· "repo": {
··········· "description": "Repository name",
··········· "type": "string"
········· }
······· },
······· "required": [
········· "owner",
········· "repo",
... (truncated)
JSON (min)
chars: 30,724 tokens: 6,840 chars_og/tok: 7.6 enc_chars/tok: 4.5
[{"inputSchema":{"json":{"properties":{"body":{"description":"Comment content","type":"string"},"issue_number":{"description":"Issue number to comment on","type":"number"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","issue_number","body"],"type":"object"}},"name":"add_issue_comment","description":"Add a comment to a specific issue in a GitHub repository."},{"inputSchema":{"json":{"properties":{"body":{"description":"The text of the review comment","type":"string"},"line":{"description":"The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range","type":"number"},"owner":{"description":"Repository owner","type":"string"},"path":{"description":"The relative path to the file that necessitates a comment","type":"string"},"pullNumber":{"description":"Pull request number","type":"number"},"repo":{"description":"Repository name","type":"string"},"side":{"description":"The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state","enum":["LEFT","RIGHT"],"type":"string"},"startLine":{"description":"For multi-line comments, the first line of the range that the comment applies to","type":"number"},"startSide":{"description":"For multi-line comments, the starting side of the diff that the comment applies to. 
LEFT indicates the previous state, RIGHT indicates the new state","enum":["LEFT","RIGHT"],"type":"string"},"subjectType":{"description":"The level at which the comment is targeted","enum":["FILE","LINE"],"type":"string"}},"required":["owner","repo","pullNumber","path","body","subjectType"],"type":"object"}},"name":"add_pull_request_review_comment_to_pending_review","description":"Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure)."},{"inputSchema":{"json":{"properties":{"issueNumber":{"description":"Issue number","type":"number"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","issueNumber"],"type":"object"}},"name":"assign_copilot_to_issue","description":"Assign Copilot to a specific issue in a GitHub repository.\n\nThis tool can help with the following outcomes:\n- a Pull Request created with source code changes to resolve the issue\n\n\nMore information can be found at:\n- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot\n"},{"inputSchema":{"json":{"properties":{"body":{"description":"Review comment text","type":"string"},"commitID":{"description":"SHA of commit to review","type":"string"},"event":{"description":"Review action to perform","enum":["APPROVE","REQUEST_CHANGES","COMMENT"],"type":"string"},"owner":{"description":"Repository owner","type":"string"},"pullNumber":{"description":"Pull request number","type":"number"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","pullNumber","body","event"],"type":"object"}},"name":"create_and_submit_pull_request_review","description":"Create and submit a review for a pull request without review comments."},{"inputSchema":{"json":{"properties":{"branch":{"description":"Name for new 
branch","type":"string"},"from_branch":{"description":"Source branch (defaults to repo default)","type":"string"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","branch"],"type":"object"}},"name":"create_branch","description":"Create a new branch in a GitHub repository"},{"inputSchema":{"json":{"properties":{"assignees":{"description":"Usernames to assign to this issue","items":{"type":"string"},"type":"array"},"body":{"description":"Issue body content","type":"string"},"labels":{"description":"Labels to apply to this issue","items":{"type":"string"},"type":"array"},"milestone":{"description":"Milestone number","type":"number"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"},"title":{"description":"Issue title","type":"string"}},"required":["owner","repo","title"],"type":"object"}},"name":"create_issue","description":"Create a new issue in a GitHub repository."},{"inputSchema":{"json":{"properties":{"branch":{"description":"Branch to create/update the file in","type":"string"},"content":{"description":"Content of the file","type":"string"},"message":{"description":"Commit message","type":"string"},"owner":{"description":"Repository owner (username or organization)","type":"string"},"path":{"description":"Path where to create/update the file","type":"string"},"repo":{"description":"Repository name","type":"string"},"sha":{"description":"SHA of file being replaced (for updates)","type":"string"}},"required":["ow
... (truncated)
CSV: N/A
TSV: N/A
YAML
chars: 38,139 tokens: 16,770 chars_og/tok: 3.1 enc_chars/tok: 2.3
- description: Add a comment to a specific issue in a GitHub repository.
· inputSchema:
··· json:
····· properties:
······· body:
········· description: Comment content
········· type: string
······· issue_number:
········· description: Issue number to comment on
········· type: number
······· owner:
········· description: Repository owner
········· type: string
······· repo:
········· description: Repository name
········· type: string
····· required:
····· - owner
····· - repo
····· - issue_number
····· - body
····· type: object
· name: add_issue_comment
- description: Add a comment to the requester's latest pending pull request review,
··· a pending review needs to already exist to call this (check with the user if not
... (truncated)
TOON
chars: 38,376 tokens: 17,296 chars_og/tok: 3.0 enc_chars/tok: 2.2
[51]:
· -
··· inputSchema:
····· json:
······· properties:
········· body:
··········· description: Comment content
··········· type: string
········· issue_number:
··········· description: Issue number to comment on
··········· type: number
········· owner:
··········· description: Repository owner
··········· type: string
········· repo:
··········· description: Repository name
··········· type: string
······· required[4]: owner,repo,issue_number,body
······· type: object
··· name: add_issue_comment
··· description: Add a comment to a specific issue in a GitHub repository.
· -
··· inputSchema:
····· json:
······· properties:
... (truncated)
TSON
chars: 25,878 tokens: 7,318 chars_og/tok: 7.1 enc_chars/tok: 3.5
{@inputSchema(@json),name,description#51|{{@properties,required,type|{@body,issue_number,owner,repo|{@description,type|"Comment content",string},{@description,type|"Issue number to comment on",number},{@description,type|"Repository owner",string},{@description,type|"Repository name",string}},[owner,repo,issue_number,body],object}},add_issue_comment,"Add a comment to a specific issue in a GitHub repository."|{{@properties,required,type|{@body,line,owner,path,pullNumber,repo,side,startLine,startSide,subjectType|{@description,type|"The text of the review comment",string},{@description,type|"The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range",number},{@description,type|"Repository owner",string},{@description,type|"The relative path to the file that necessitates a comment",string},{@description,type|"Pull request number",number},{@description,type|"Repository name",string},{@description,enum,type|"The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state",[LEFT,RIGHT],string},{@description,type|"For multi-line comments, the first line of the range that the comment applies to",number},{@description,enum,type|"For multi-line comments, the starting side of the diff that the comment applies to. 
LEFT indicates the previous state, RIGHT indicates the new state",[LEFT,RIGHT],string},{@description,enum,type|"The level at which the comment is targeted",[FILE,LINE],string}},[owner,repo,pullNumber,path,body,subjectType],object}},add_pull_request_review_comment_to_pending_review,"Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure)."|{{@properties,required,type|{@issueNumber,owner,repo|{@description,type|"Issue number",number},{@description,type|"Repository owner",string},{@description,type|"Repository name",string}},[owner,repo,issueNumber],object}},assign_copilot_to_issue,"Assign Copilot to a specific issue in a GitHub repository.\n\nThis tool can help with the following outcomes:\n- a Pull Request created with source code changes to resolve the issue\n\n\nMore information can be found at:\n- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot\n"|{{@properties,required,type|{@body,commitID,event,owner,pullNumber,repo|{@description,type|"Review comment text",string},{@description,type|"SHA of commit to review",string},{@description,enum,type|"Review action to perform",[APPROVE,REQUEST_CHANGES,COMMENT],string},{@description,type|"Repository owner",string},{@description,type|"Pull request number",number},{@description,type|"Repository name",string}},[owner,repo,pullNumber,body,event],object}},create_and_submit_pull_request_review,"Create and submit a review for a pull request without review comments."|{{@properties,required,type|{@branch,from_branch,owner,repo|{@description,type|"Name for new branch",string},{@description,type|"Source branch (defaults to repo default)",string},{@description,type|"Repository owner",string},{@description,type|"Repository name",string}},[owner,repo,branch],object}},create_branch,"Create a new branch in a GitHub 
repository"|{{@properties,required,type|{@assignees,body,labels,milestone,owner,repo,title|{@description,items,type|"Usernames to assign to this issue",{@type|string},array},{@description,type|"Issue body content",string},{@description,items,type|"Labels to apply to this issue",{@type|string},array},{@description,type|"Milestone number",number},{@description,type|"Repository owner",string},{@description,type|"Repository name",string},{@description,type|"Issue title",string}},[owner,repo,title],object}},create_issue,"Create a new issue in a GitHub repository."|{{@properties,required,type|{@branch,content,message,owner,path,repo,sha|{@description,type|"Branch to create/update the file in",string},{@description,type|"Content of the file",string},{@description,type|"Commit message",string},{@description,type|"Repository owner (username or organization)",string},{@description,type|"Path where to create/update the file",string},{@description,type|"Repository name",string},{@description,type|"SHA of file being replaced (for updates)",string}},[owner,repo,path,content,message,branch],object}},create_or_update_file,"Create or update a single file in a GitHub repository. If updating, you must provide the SHA of the file you want to update."|{{@properties,required,type|{@commitID,owner,pullNumber,repo|{@description,type|"SHA of commit to review",string},{@description,type|"Repository owner",string},{@description,type|"Pull request number",number},{@description,type|"Repository name",string}},[owner,repo,pullNumber],object}},create_pending_pull_request_review,"Create a pending review for a pull request. Call this first before attempting to add comments to a pending review, and ultimately submitting it
... (truncated)
minemizer
chars: 23,383 tokens: 5,559 chars_og/tok: 9.3 enc_chars/tok: 4.2
inputSchema{ json{ properties{ owner{ description; type}; repo{ description; type}; ...}; required[]; type}}; name; description
{{ {{ Repository owner; string};{ Repository name; string}; body:{ description: Comment content; type: string}; issue_number:{ description: Issue number to comment on; type: number}};[ owner; repo; issue_number; body]; object}}; add_issue_comment; Add a comment to a specific issue in a GitHub repository.
{{ {{ Repository owner; string};{ Repository name; string}; body:{ description: The text of the review comment; type: string}; line:{ description: The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range; type: number}; path:{ description: The relative path to the file that necessitates a comment; type: string}; pullNumber:{ description: Pull request number; type: number}; side:{ description: The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state; enum:[ LEFT; RIGHT]; type: string}; startLine:{ description: For multi-line comments, the first line of the range that the comment applies to; type: number}; startSide:{ description: For multi-line comments, the starting side of the diff that the comment applies to. LEFT indicates the previous state, RIGHT indicates the new state; enum:[ LEFT; RIGHT]; type: string}; subjectType:{ description: The level at which the comment is targeted; enum:[ FILE; LINE]; type: string}};[ owner; repo; pullNumber; path; body; subjectType]; object}}; add_pull_request_review_comment_to_pending_review; Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure).
{{ {{ Repository owner; string};{ Repository name; string}; issueNumber:{ description: Issue number; type: number}};[ owner; repo; issueNumber]; object}}; assign_copilot_to_issue; Assign Copilot to a specific issue in a GitHub repository.

This tool can help with the following outcomes:
- a Pull Request created with source code changes to resolve the issue↵↵

More information can be found at:
- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot

{{ {{ Repository owner; string};{ Repository name; string}; body:{ description: Review comment text; type: string}; commitID:{ description: SHA of commit to review; type: string}; event:{ description: Review action to perform; enum:[ APPROVE; REQUEST_CHANGES; COMMENT]; type: string}; pullNumber:{ description: Pull request number; type: number}};[ owner; repo; pullNumber; body; event]; object}}; create_and_submit_pull_request_review; Create and submit a review for a pull request without review comments.
{{ {{ Repository owner; string};{ Repository name; string}; branch:{ description: Name for new branch; type: string}; from_branch:{ description: Source branch (defaults to repo default); type: string}};[ owner; repo; branch]; object}}; create_branch; Create a new branch in a GitHub repository
{{ {{ Repository owner; string};{ Repository name; string}; assignees:{ description: Usernames to assign to this issue; items:{ type: string}; type: array}; body:{ description: Issue body content; type: string}; labels:{ description: Labels to apply to this issue; items:{ type: string}; type: array}; milestone:{ description: Milestone number; type: number}; title:{ description: Issue title; type: string}};[ owner; repo; title]; object}}; create_issue; Create a new issue in a GitHub repository.
{{ {{ Repository owner (username or organization); string};{ Repository name; string}; branch:{ description: Branch to create/update the file in; type: string}; content:{ description: Content of the file; type: string}; message:{ description: Commit message; type: string}; path:{ description: Path where to create/update the file; type: string}; sha:{ description: SHA of file being replaced (for updates); type: string}};[ owner; repo; path; content; message; branch]; object}}; create_or_update_file; Create or update a single file in a GitHub repository. If updating, you must provide the SHA of the file you want to update.
{{ {{ Repository owner; string};{ Repository name; string}; commitID:{ description: SHA of commit to review; type: string}; pullNumber:{ description: Pull request number; type: number}};[ owner; repo; pullNumber]; object}}; create_pending_pull_request_review; Create a pending review for a pull request. Call this first before attempting to add comments to a pending review, and ultimately submitting it. A pending pull request review means a pull request review, it is pending because you create it first and submit it later, and the PR author will not see it until it is submitted.
{{ {{ Repository owner; string};{ Repository name; string}; base:{ description: Branch to merge into; type: string}; body:{ description: PR description; type: string}; draft:{ description: Create as draft PR; type: boolean}; head:{ description: Branch containing changes; type: string}; maintainer_can_modify:{ description: Allow maintainer edits; type: boolean}; title:{ description: PR title; type: string}};[ owner; repo; title; head; base]; object}}; create_pull_request; Create a new pull request in a GitHub repository.
{{ {;; autoInit:{ description: Initialize with README; type: boolean}; description:{ description: Repository description; type: string}; name:{ description: Repository name; type: string}; private:{ description: Whether repo should be private; type: boolean}};[ name]; object}}; create_repository; Create a new GitHub repository in your account
{{ {{ Repository owner (username or organization); string};{ Repository name; string}; branch:{ description: Branch to delete the file from; type: string}; message:{ description: Commit message; type: string}; path:{ description: Path to the file to delete; type: string}};[ owner; repo; path; message; branch]; object}}; delete_file; Delete a file from a GitHub repository
{{ {{ Repository owner; string};{ Repository name; string}; pullNumber:{ description: Pull request number; type: number}};[ owner; repo; pullNumber]; object}}; delete_pending_pull_request_review; Delete the requester's latest pending pull request review. Use this after the user decides not to submit a pending review, if you don't know if they already created one then check first.
{{ {;; state:{ description: The new state of the notification (read/done); enum:[ read; done]; type: string}; threadID:{ description: The ID of the notification thread; type: string}};[ threadID]; object}}; dismiss_notification; Dismiss a notification by marking it as read or done
{{ {{ Repository owner; string};{ Repository name; string}; organization:{ description: Organization to fork to; type: string}};[ owner; repo]; object}}; fork_repository; Fork a GitHub repository to your account or specified organization
{{ {{ The owner of the repository.; string};{ The name of the repository.; string}; alertNumber:{ description: The number of the alert.; type: number}};[ owner; repo; alertNumber]; object}}; get_code_scanning_alert; Get details of a specific code scanning alert in a GitHub repository.
{{ {{ Repository owner; string};{ Repository name; string}; page:{ description: Page number for pagination (min 1); minimum: 1; type: number}; perPage:{ description: Results per page for pagination (min 1, max 100); maximum: 100; minimum: 1; type: number}; sha:{ description: Commit SHA, branch name, or tag name; type: string}};[ owner; repo; sha]; object}}; get_commit; Get details for a commit from a GitHub repository
... (truncated)
minemizer (compact)
chars: 21,912 tokens: 5,672 chars_og/tok: 9.1 enc_chars/tok: 3.9
inputSchema{json{properties{owner{description;type};repo{description;type};...};required[];type}};name;description
{{{{Repository owner;string};{Repository name;string};body:{description:Comment content;type:string};issue_number:{description:Issue number to comment on;type:number}};[owner;repo;issue_number;body];object}};add_issue_comment;Add a comment to a specific issue in a GitHub repository.
{{{{Repository owner;string};{Repository name;string};body:{description:The text of the review comment;type:string};line:{description:The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range;type:number};path:{description:The relative path to the file that necessitates a comment;type:string};pullNumber:{description:Pull request number;type:number};side:{description:The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state;enum:[LEFT;RIGHT];type:string};startLine:{description:For multi-line comments, the first line of the range that the comment applies to;type:number};startSide:{description:For multi-line comments, the starting side of the diff that the comment applies to. LEFT indicates the previous state, RIGHT indicates the new state;enum:[LEFT;RIGHT];type:string};subjectType:{description:The level at which the comment is targeted;enum:[FILE;LINE];type:string}};[owner;repo;pullNumber;path;body;subjectType];object}};add_pull_request_review_comment_to_pending_review;Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure).
{{{{Repository owner;string};{Repository name;string};issueNumber:{description:Issue number;type:number}};[owner;repo;issueNumber];object}};assign_copilot_to_issue;Assign Copilot to a specific issue in a GitHub repository.

This tool can help with the following outcomes:
- a Pull Request created with source code changes to resolve the issue↵↵

More information can be found at:
- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot

{{{{Repository owner;string};{Repository name;string};body:{description:Review comment text;type:string};commitID:{description:SHA of commit to review;type:string};event:{description:Review action to perform;enum:[APPROVE;REQUEST_CHANGES;COMMENT];type:string};pullNumber:{description:Pull request number;type:number}};[owner;repo;pullNumber;body;event];object}};create_and_submit_pull_request_review;Create and submit a review for a pull request without review comments.
{{{{Repository owner;string};{Repository name;string};branch:{description:Name for new branch;type:string};from_branch:{description:Source branch (defaults to repo default);type:string}};[owner;repo;branch];object}};create_branch;Create a new branch in a GitHub repository
{{{{Repository owner;string};{Repository name;string};assignees:{description:Usernames to assign to this issue;items:{type:string};type:array};body:{description:Issue body content;type:string};labels:{description:Labels to apply to this issue;items:{type:string};type:array};milestone:{description:Milestone number;type:number};title:{description:Issue title;type:string}};[owner;repo;title];object}};create_issue;Create a new issue in a GitHub repository.
{{{{Repository owner (username or organization);string};{Repository name;string};branch:{description:Branch to create/update the file in;type:string};content:{description:Content of the file;type:string};message:{description:Commit message;type:string};path:{description:Path where to create/update the file;type:string};sha:{description:SHA of file being replaced (for updates);type:string}};[owner;repo;path;content;message;branch];object}};create_or_update_file;Create or update a single file in a GitHub repository. If updating, you must provide the SHA of the file you want to update.
{{{{Repository owner;string};{Repository name;string};commitID:{description:SHA of commit to review;type:string};pullNumber:{description:Pull request number;type:number}};[owner;repo;pullNumber];object}};create_pending_pull_request_review;Create a pending review for a pull request. Call this first before attempting to add comments to a pending review, and ultimately submitting it. A pending pull request review means a pull request review, it is pending because you create it first and submit it later, and the PR author will not see it until it is submitted.
{{{{Repository owner;string};{Repository name;string};base:{description:Branch to merge into;type:string};body:{description:PR description;type:string};draft:{description:Create as draft PR;type:boolean};head:{description:Branch containing changes;type:string};maintainer_can_modify:{description:Allow maintainer edits;type:boolean};title:{description:PR title;type:string}};[owner;repo;title;head;base];object}};create_pull_request;Create a new pull request in a GitHub repository.
{{{;;autoInit:{description:Initialize with README;type:boolean};description:{description:Repository description;type:string};name:{description:Repository name;type:string};private:{description:Whether repo should be private;type:boolean}};[name];object}};create_repository;Create a new GitHub repository in your account
{{{{Repository owner (username or organization);string};{Repository name;string};branch:{description:Branch to delete the file from;type:string};message:{description:Commit message;type:string};path:{description:Path to the file to delete;type:string}};[owner;repo;path;message;branch];object}};delete_file;Delete a file from a GitHub repository
{{{{Repository owner;string};{Repository name;string};pullNumber:{description:Pull request number;type:number}};[owner;repo;pullNumber];object}};delete_pending_pull_request_review;Delete the requester's latest pending pull request review. Use this after the user decides not to submit a pending review, if you don't know if they already created one then check first.
{{{;;state:{description:The new state of the notification (read/done);enum:[read;done];type:string};threadID:{description:The ID of the notification thread;type:string}};[threadID];object}};dismiss_notification;Dismiss a notification by marking it as read or done
{{{{Repository owner;string};{Repository name;string};organization:{description:Organization to fork to;type:string}};[owner;repo];object}};fork_repository;Fork a GitHub repository to your account or specified organization
{{{{The owner of the repository.;string};{The name of the repository.;string};alertNumber:{description:The number of the alert.;type:number}};[owner;repo;alertNumber];object}};get_code_scanning_alert;Get details of a specific code scanning alert in a GitHub repository.
{{{{Repository owner;string};{Repository name;string};page:{description:Page number for pagination (min 1);minimum:1;type:number};perPage:{description:Results per page for pagination (min 1, max 100);maximum:100;minimum:1;type:number};sha:{description:Commit SHA, branch name, or tag name;type:string}};[owner;repo;sha];object}};get_commit;Get details for a commit from a GitHub repository
... (truncated)
simple_flat.json — Original: 763 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)7633342.32.3
JSON (min)5221654.63.2
CSV2341017.62.3
TSV2341017.62.3
YAML4891804.22.7
TOON2461037.42.4
TSON229958.02.4
minemizer251839.23.0
minemizer (compact)224918.42.5
JSON (pretty)
chars: 763 tokens: 334 chars_og/tok: 2.3 enc_chars/tok: 2.3
<s>[
{
··"id":1,
··"name":"Alice",
··"role":"Engineer",
··"department":"Backend"
},
{
··"id":2,
··"name":"Bob",
··"role":"Designer",
··"department":"Frontend"
},
{
··"id":3,
··"name":"Carol",
··"role":"Manager",
··"department":"Product"
},
{
··"id":4,
··"name":"David",
··"role":"Engineer",
··"department":"Infrastructure"
},
... (truncated)
JSON (min)
chars: 522 tokens: 165 chars_og/tok: 4.6 enc_chars/tok: 3.2
<s>[{"id":1,"name":"Alice","role":"Engineer","department":"Backend"},{"id":2,"name":"Bob","role":"Designer","department":"Frontend"},{"id":3,"name":"Carol","role":"Manager","department":"Product"},{"id":4,"name":"David","role":"Engineer","department":"Infrastructure"},{"id":5,"name":"Eva","role":"Analyst","department":"Data"},{"id":6,"name":"Frank","role":"Engineer","department":"Backend"},{"id":7,"name":"Grace","role":"Designer","department":"Mobile"},{"id":8,"name":"Henry","role":"Manager","department":"Engineering"}]
CSV
chars: 234 tokens: 101 chars_og/tok: 7.6 enc_chars/tok: 2.3
<s>id,name,role,department
1,Alice,Engineer,Backend
2,Bob,Designer,Frontend
3,Carol,Manager,Product
4,David,Engineer,Infrastructure
5,Eva,Analyst,Data
6,Frank,Engineer,Backend
7,Grace,Designer,Mobile
8,Henry,Manager,Engineering
TSV
chars: 234 tokens: 101 chars_og/tok: 7.6 enc_chars/tok: 2.3
<s>idnameroledepartment
1AliceEngineerBackend
2BobDesignerFrontend
3CarolManagerProduct
4DavidEngineerInfrastructure
5EvaAnalystData
6FrankEngineerBackend
7GraceDesignerMobile
8HenryManagerEngineering
YAML
chars: 489 tokens: 180 chars_og/tok: 4.2 enc_chars/tok: 2.7
<s>-department:Backend
id:1
name:Alice
role:Engineer
-department:Frontend
id:2
name:Bob
role:Designer
-department:Product
id:3
name:Carol
role:Manager
-department:Infrastructure
id:4
name:David
role:Engineer
-department:Data
id:5
name:Eva
role:Analyst
-department:Backend
id:6
name:Frank
role:Engineer
-department:Mobile
... (truncated)
TOON
chars: 246 tokens: 103 chars_og/tok: 7.4 enc_chars/tok: 2.4
<s>[8]{id,name,role,department}:
·1,Alice,Engineer,Backend
·2,Bob,Designer,Frontend
·3,Carol,Manager,Product
·4,David,Engineer,Infrastructure
·5,Eva,Analyst,Data
·6,Frank,Engineer,Backend
·7,Grace,Designer,Mobile
·8,Henry,Manager,Engineering
TSON
chars: 229 tokens: 95 chars_og/tok: 8.0 enc_chars/tok: 2.4
<s>{@id,name,role,department#8|1,Alice,Engineer,Backend|2,Bob,Designer,Frontend|3,Carol,Manager,Product|4,David,Engineer,Infrastructure|5,Eva,Analyst,Data|6,Frank,Engineer,Backend|7,Grace,Designer,Mobile|8,Henry,Manager,Engineering}
minemizer
chars: 251 tokens: 83 chars_og/tok: 9.2 enc_chars/tok: 3.0
<s>id;name;role;department
1;Alice;Engineer;Backend
2;Bob;Designer;Frontend
3;Carol;Manager;Product
4;David;Engineer;Infrastructure
5;Eva;Analyst;Data
6;Frank;Engineer;Backend
7;Grace;Designer;Mobile
8;Henry;Manager;Engineering
minemizer (compact)
chars: 224 tokens: 91 chars_og/tok: 8.4 enc_chars/tok: 2.5
<s>id;name;role;department
1;Alice;Engineer;Backend
2;Bob;Designer;Frontend
3;Carol;Manager;Product
4;David;Engineer;Infrastructure
5;Eva;Analyst;Data
6;Frank;Engineer;Backend
7;Grace;Designer;Mobile
8;Henry;Manager;Engineering
nested_objects.json — Original: 1039 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)1,0394352.42.4
JSON (min)6182114.92.9
CSVN/A
TSVN/A
YAML6292464.22.6
TOON6752384.42.8
TSON3061417.42.2
minemizer3251327.92.5
minemizer (compact)2901397.52.1
JSON (pretty)
chars: 1,039 tokens: 435 chars_og/tok: 2.4 enc_chars/tok: 2.4
<s>[
{
··"id":"u1",
··"name":"Lukas",
··"location":{
····"office":"KaunasHQ",
····"floor":12
··},
··"skills":[
····"python",
····"kubernetes"
··]
},
{
··"id":"u2",
··"name":"Emma",
··"location":{
····"office":"BostonHub",
····"floor":7
··},
··"skills":[
····"react",
····"typescript",
····"graphql"
··]
... (truncated)
JSON (min)
chars: 618 tokens: 211 chars_og/tok: 4.9 enc_chars/tok: 2.9
<s>[{"id":"u1","name":"Lukas","location":{"office":"KaunasHQ","floor":12},"skills":["python","kubernetes"]},{"id":"u2","name":"Emma","location":{"office":"BostonHub","floor":7},"skills":["react","typescript","graphql"]},{"id":"u3","name":"Pierre","location":{"office":"ParisOffice","floor":3},"skills":["rust"]},{"id":"u4","name":"Hana","location":{"office":"TokyoTower","floor":15},"skills":["go","docker"]},{"id":"u5","name":"Wei","location":{"office":"TaipeiCenter","floor":8},"skills":["java","spring"]},{"id":"u6","name":"Charlotte","location":{"office":"LondonBridge","floor":5},"skills":["python","django"]}]
CSV: N/A
TSV: N/A
YAML
chars: 629 tokens: 246 chars_og/tok: 4.2 enc_chars/tok: 2.6
<s>-id:u1
location:
··floor:12
··office:KaunasHQ
name:Lukas
skills:
-python
-kubernetes
-id:u2
location:
··floor:7
··office:BostonHub
name:Emma
skills:
-react
-typescript
-graphql
-id:u3
location:
··floor:3
··office:ParisOffice
name:Pierre
skills:
-rust
-id:u4
... (truncated)
TOON
chars: 675 tokens: 238 chars_og/tok: 4.4 enc_chars/tok: 2.8
<s>[6]:
-id:u1
··name:Lukas
··location:
····office:KaunasHQ
····floor:12
··skills[2]:python,kubernetes
-id:u2
··name:Emma
··location:
····office:BostonHub
····floor:7
··skills[3]:react,typescript,graphql
-id:u3
··name:Pierre
··location:
····office:ParisOffice
····floor:3
··skills[1]:rust
-id:u4
··name:Hana
··location:
····office:TokyoTower
····floor:15
··skills[2]:go,docker
... (truncated)
TSON
chars: 306 tokens: 141 chars_og/tok: 7.4 enc_chars/tok: 2.2
<s>{@id,name,location(@office,floor),skills#6|u1,Lukas,{"KaunasHQ",12},[python,kubernetes]|u2,Emma,{"BostonHub",7},[react,typescript,graphql]|u3,Pierre,{"ParisOffice",3},[rust]|u4,Hana,{"TokyoTower",15},[go,docker]|u5,Wei,{"TaipeiCenter",8},[java,spring]|u6,Charlotte,{"LondonBridge",5},[python,django]}
minemizer
chars: 325 tokens: 132 chars_og/tok: 7.9 enc_chars/tok: 2.5
<s>id;name;location{office;floor};skills[]
u1;Lukas;{KaunasHQ;12};[python;kubernetes]
u2;Emma;{BostonHub;7};[react;typescript;graphql]
u3;Pierre;{ParisOffice;3};[rust]
u4;Hana;{TokyoTower;15};[go;docker]
u5;Wei;{TaipeiCenter;8};[java;spring]
u6;Charlotte;{LondonBridge;5};[python;django]
minemizer (compact)
chars: 290 tokens: 139 chars_og/tok: 7.5 enc_chars/tok: 2.1
<s>id;name;location{office;floor};skills[]
u1;Lukas;{KaunasHQ;12};[python;kubernetes]
u2;Emma;{BostonHub;7};[react;typescript;graphql]
u3;Pierre;{ParisOffice;3};[rust]
u4;Hana;{TokyoTower;15};[go;docker]
u5;Wei;{TaipeiCenter;8};[java;spring]
u6;Charlotte;{LondonBridge;5};[python;django]
lists_of_primitives.json — Original: 610 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)6102802.22.2
JSON (min)3301254.92.6
CSVN/A
TSVN/A
YAML3411573.92.2
TOON3391414.32.4
TSON168797.72.1
minemizer188797.72.4
minemizer (compact)165837.32.0
JSON (pretty)
chars: 610 tokens: 280 chars_og/tok: 2.2 enc_chars/tok: 2.2
<s>[
{
··"id":1,
··"name":"Alice",
··"skills":[
····"python",
····"go",
····"rust"
··]
},
{
··"id":2,
··"name":"Bob",
··"skills":[
····"javascript",
····"typescript"
··]
},
{
··"id":3,
··"name":"Carol",
··"skills":[
····"java",
····"kotlin",
····"scala",
... (truncated)
JSON (min)
chars: 330 tokens: 125 chars_og/tok: 4.9 enc_chars/tok: 2.6
<s>[{"id":1,"name":"Alice","skills":["python","go","rust"]},{"id":2,"name":"Bob","skills":["javascript","typescript"]},{"id":3,"name":"Carol","skills":["java","kotlin","scala","groovy"]},{"id":4,"name":"David","skills":["c","cpp"]},{"id":5,"name":"Eva","skills":["ruby","elixir","erlang"]},{"id":6,"name":"Frank","skills":["swift"]}]
CSV: N/A
TSV: N/A
YAML
chars: 341 tokens: 157 chars_og/tok: 3.9 enc_chars/tok: 2.2
<s>-id:1
name:Alice
skills:
-python
-go
-rust
-id:2
name:Bob
skills:
-javascript
-typescript
-id:3
name:Carol
skills:
-java
-kotlin
-scala
-groovy
-id:4
name:David
skills:
-c
-cpp
-id:5
name:Eva
... (truncated)
TOON
chars: 339 tokens: 141 chars_og/tok: 4.3 enc_chars/tok: 2.4
<s>[6]:
-id:1
··name:Alice
··skills[3]:python,go,rust
-id:2
··name:Bob
··skills[2]:javascript,typescript
-id:3
··name:Carol
··skills[4]:java,kotlin,scala,groovy
-id:4
··name:David
··skills[2]:c,cpp
-id:5
··name:Eva
··skills[3]:ruby,elixir,erlang
-id:6
··name:Frank
··skills[1]:swift
TSON
chars: 168 tokens: 79 chars_og/tok: 7.7 enc_chars/tok: 2.1
<s>{@id,name,skills#6|1,Alice,[python,go,rust]|2,Bob,[javascript,typescript]|3,Carol,[java,kotlin,scala,groovy]|4,David,[c,cpp]|5,Eva,[ruby,elixir,erlang]|6,Frank,[swift]}
minemizer
chars: 188 tokens: 79 chars_og/tok: 7.7 enc_chars/tok: 2.4
<s>id;name;skills[]
1;Alice;[python;go;rust]
2;Bob;[javascript;typescript]
3;Carol;[java;kotlin;scala;groovy]
4;David;[c;cpp]
5;Eva;[ruby;elixir;erlang]
6;Frank;[swift]
minemizer (compact)
chars: 165 tokens: 83 chars_og/tok: 7.3 enc_chars/tok: 2.0
<s>id;name;skills[]
1;Alice;[python;go;rust]
2;Bob;[javascript;typescript]
3;Carol;[java;kotlin;scala;groovy]
4;David;[c;cpp]
5;Eva;[ruby;elixir;erlang]
6;Frank;[swift]
sparse_data.json — Original: 611 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)6112852.12.1
JSON (min)4001464.22.7
CSVN/A
TSVN/A
YAML3841583.92.4
TOON4381673.72.6
TSON3281454.22.3
minemizer200797.72.5
minemizer (compact)180886.92.0
JSON (pretty)
chars: 611 tokens: 285 chars_og/tok: 2.1 enc_chars/tok: 2.1
<s>[
{
··"id":1,
··"name":"Erik",
··"department":"Engineering"
},
{
··"id":2,
··"name":"Rachel",
··"department":"Design",
··"remote":true
},
{
··"id":3,
··"name":"Hans"
},
{
··"id":4,
··"name":"Kenji",
··"department":"Sales",
··"slack":"@kenji",
··"remote":false
},
{
··"id":5,
... (truncated)
JSON (min)
chars: 400 tokens: 146 chars_og/tok: 4.2 enc_chars/tok: 2.7
<s>[{"id":1,"name":"Erik","department":"Engineering"},{"id":2,"name":"Rachel","department":"Design","remote":true},{"id":3,"name":"Hans"},{"id":4,"name":"Kenji","department":"Sales","slack":"@kenji","remote":false},{"id":5,"name":"Mai","remote":true},{"id":6,"name":"Tom","department":"Engineering"},{"id":7,"name":"Priya","slack":"@priya","remote":true},{"id":8,"name":"Nina","department":"Marketing"}]
CSV: N/A
TSV: N/A
YAML
chars: 384 tokens: 158 chars_og/tok: 3.9 enc_chars/tok: 2.4
<s>-department:Engineering
id:1
name:Erik
-department:Design
id:2
name:Rachel
remote:true
-id:3
name:Hans
-department:Sales
id:4
name:Kenji
remote:false
slack:'@kenji'
-id:5
name:Mai
remote:true
-department:Engineering
id:6
name:Tom
-id:7
name:Priya
remote:true
slack:'@priya'
-department:Marketing
... (truncated)
TOON
chars: 438 tokens: 167 chars_og/tok: 3.7 enc_chars/tok: 2.6
<s>[8]:
-id:1
··name:Erik
··department:Engineering
-id:2
··name:Rachel
··department:Design
··remote:true
-id:3
··name:Hans
-id:4
··name:Kenji
··department:Sales
··slack:@kenji
··remote:false
-id:5
··name:Mai
··remote:true
-id:6
··name:Tom
··department:Engineering
-id:7
··name:Priya
··slack:@priya
··remote:true
... (truncated)
TSON
chars: 328 tokens: 145 chars_og/tok: 4.2 enc_chars/tok: 2.3
<s>[{@id,name,department|1,Erik,Engineering},{@id,name,department,remote|2,Rachel,Design,true},{@id,name|3,Hans},{@id,name,department,slack,remote|4,Kenji,Sales,"@kenji",false},{@id,name,remote|5,Mai,true},{@id,name,department|6,Tom,Engineering},{@id,name,slack,remote|7,Priya,"@priya",true},{@id,name,department|8,Nina,Marketing}]
minemizer
chars: 200 tokens: 79 chars_og/tok: 7.7 enc_chars/tok: 2.5
<s>id;name;department;remote
1;Erik;Engineering
2;Rachel;Design;true
3;Hans
4;Kenji;Sales;false;slack:@kenji
5;Mai;;true
6;Tom;Engineering
7;Priya;;true;slack:@priya
8;Nina;Marketing;
minemizer (compact)
chars: 180 tokens: 88 chars_og/tok: 6.9 enc_chars/tok: 2.0
<s>id;name;department;remote
1;Erik;Engineering
2;Rachel;Design;true
3;Hans
4;Kenji;Sales;false;slack:@kenji
5;Mai;;true
6;Tom;Engineering
7;Priya;;true;slack:@priya
8;Nina;Marketing;
complex_mixed.json — Original: 1320 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)1,3205602.42.4
JSON (min)7602844.62.7
CSVN/A
TSVN/A
YAML8183383.92.4
TOON8813294.02.7
TSON4532375.61.9
minemizer4032036.52.0
minemizer (compact)3612146.21.7
JSON (pretty)
chars: 1,320 tokens: 560 chars_og/tok: 2.4 enc_chars/tok: 2.4
<s>[
{
··"id":1,
··"profile":{
····"name":"Grace",
····"location":{
······"city":"NYC",
······"country":"USA"
····}
··},
··"tags":[
····"admin",
····"verified"
··],
··"metadata":{
····"created":"2024-01-15"
··}
},
{
··"id":2,
··"profile":{
····"name":"Henry",
····"location":{
······"city":"London",
······"country":"UK"
... (truncated)
JSON (min)
chars: 760 tokens: 284 chars_og/tok: 4.6 enc_chars/tok: 2.7
<s>[{"id":1,"profile":{"name":"Grace","location":{"city":"NYC","country":"USA"}},"tags":["admin","verified"],"metadata":{"created":"2024-01-15"}},{"id":2,"profile":{"name":"Henry","location":{"city":"London","country":"UK"}},"tags":["user"],"metadata":{"created":"2024-02-20","updated":"2024-03-10"}},{"id":3,"profile":{"name":"Ivy","location":{"city":"Tokyo","country":"Japan"}},"tags":["moderator","verified","premium"],"metadata":{"created":"2024-01-05"}},{"id":4,"profile":{"name":"Jack","location":{"city":"Sydney","country":"Australia"}},"tags":["user","new"],"metadata":{"created":"2024-04-01"}},{"id":5,"profile":{"name":"Kate","location":{"city":"Berlin","country":"Germany"}},"tags":["admin"],"metadata":{"created":"2023-12-01","updated":"2024-02-15"}}]
CSV: N/A
TSV: N/A
YAML
chars: 818 tokens: 338 chars_og/tok: 3.9 enc_chars/tok: 2.4
<s>-id:1
metadata:
··created:'2024-01-15'
profile:
··location:
····city:NYC
····country:USA
··name:Grace
tags:
-admin
-verified
-id:2
metadata:
··created:'2024-02-20'
··updated:'2024-03-10'
profile:
··location:
····city:London
····country:UK
··name:Henry
tags:
-user
-id:3
metadata:
··created:'2024-01-05'
... (truncated)
TOON
chars: 881 tokens: 329 chars_og/tok: 4.0 enc_chars/tok: 2.7
<s>[5]:
-id:1
··profile:
····name:Grace
····location:
······city:NYC
······country:USA
··tags[2]:admin,verified
··metadata:
····created:2024-01-15
-id:2
··profile:
····name:Henry
····location:
······city:London
······country:UK
··tags[1]:user
··metadata:
····created:2024-02-20
····updated:2024-03-10
-id:3
··profile:
····name:Ivy
····location:
······city:Tokyo
... (truncated)
TSON
chars: 453 tokens: 237 chars_og/tok: 5.6 enc_chars/tok: 1.9
<s>{@id,profile(@name,location),tags,metadata#5|1,{Grace,{@city,country|NYC,USA}},[admin,verified],{@created|2024-01-15}|2,{Henry,{@city,country|London,UK}},[user],{@created,updated|2024-02-20,2024-03-10}|3,{Ivy,{@city,country|Tokyo,Japan}},[moderator,verified,premium],{@created|2024-01-05}|4,{Jack,{@city,country|Sydney,Australia}},[user,new],{@created|2024-04-01}|5,{Kate,{@city,country|Berlin,Germany}},[admin],{@created,updated|2023-12-01,2024-02-15}}
minemizer
chars: 403 tokens: 203 chars_og/tok: 6.5 enc_chars/tok: 2.0
<s>id;profile{name;location{city;country}};tags[];metadata{created;...}
1;{Grace;{NYC;USA}};[admin;verified];{2024-01-15}
2;{Henry;{London;UK}};[user];{2024-02-20;updated:2024-03-10}
3;{Ivy;{Tokyo;Japan}};[moderator;verified;premium];{2024-01-05}
4;{Jack;{Sydney;Australia}};[user;new];{2024-04-01}
5;{Kate;{Berlin;Germany}};[admin];{2023-12-01;updated:2024-02-15}
minemizer (compact)
chars: 361 tokens: 214 chars_og/tok: 6.2 enc_chars/tok: 1.7
<s>id;profile{name;location{city;country}};tags[];metadata{created;...}
1;{Grace;{NYC;USA}};[admin;verified];{2024-01-15}
2;{Henry;{London;UK}};[user];{2024-02-20;updated:2024-03-10}
3;{Ivy;{Tokyo;Japan}};[moderator;verified;premium];{2024-01-05}
4;{Jack;{Sydney;Australia}};[user;new];{2024-04-01}
5;{Kate;{Berlin;Germany}};[admin];{2023-12-01;updated:2024-02-15}
books.json — Original: 27902 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)27,90211,6262.42.4
JSON (min)22,5018,0353.52.8
CSV14,0716,1514.52.3
TSV14,0576,3604.42.2
YAML22,4008,8593.12.5
TOON14,2776,1724.52.3
TSON14,4486,2294.52.3
minemizer14,4586,0424.62.4
minemizer (compact)13,7536,0564.62.3
JSON (pretty)
chars: 27,902 tokens: 11,626 chars_og/tok: 2.4 enc_chars/tok: 2.4
<s>[
{
··"author":"ChinuaAchebe",
··"country":"Nigeria",
··"imageLink":"images/things-fall-apart.jpg",
··"language":"English",
··"link":"https://en.wikipedia.org/wiki/Things_Fall_Apart\n",
··"pages":209,
··"title":"ThingsFallApart",
··"year":1958
},
{
··"author":"HansChristianAndersen",
··"country":"Denmark",
··"imageLink":"images/fairy-tales.jpg",
··"language":"Danish",
··"link":"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",
··"pages":784,
··"title":"Fairytales",
··"year":1836
},
{
··"author":"DanteAlighieri",
··"country":"Italy",
··"imageLink":"images/the-divine-comedy.jpg",
... (truncated)
JSON (min)
chars: 22,501 tokens: 8,035 chars_og/tok: 3.5 enc_chars/tok: 2.8
<s>[{"author":"ChinuaAchebe","country":"Nigeria","imageLink":"images/things-fall-apart.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Things_Fall_Apart\n","pages":209,"title":"ThingsFallApart","year":1958},{"author":"HansChristianAndersen","country":"Denmark","imageLink":"images/fairy-tales.jpg","language":"Danish","link":"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n","pages":784,"title":"Fairytales","year":1836},{"author":"DanteAlighieri","country":"Italy","imageLink":"images/the-divine-comedy.jpg","language":"Italian","link":"https://en.wikipedia.org/wiki/Divine_Comedy\n","pages":928,"title":"TheDivineComedy","year":1315},{"author":"Unknown","country":"SumerandAkkadianEmpire","imageLink":"images/the-epic-of-gilgamesh.jpg","language":"Akkadian","link":"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n","pages":160,"title":"TheEpicOfGilgamesh","year":-1700},{"author":"Unknown","country":"AchaemenidEmpire","imageLink":"images/the-book-of-job.jpg","language":"Hebrew","link":"https://en.wikipedia.org/wiki/Book_of_Job\n","pages":176,"title":"TheBookOfJob","year":-600},{"author":"Unknown","country":"India/Iran/Iraq/Egypt/Tajikistan","imageLink":"images/one-thousand-and-one-nights.jpg","language":"Arabic","link":"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n","pages":288,"title":"OneThousandandOneNights","year":1200},{"author":"Unknown","country":"Iceland","imageLink":"images/njals-saga.jpg","language":"OldNorse","link":"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n","pages":384,"title":"Nj\u00e1l'sSaga","year":1350},{"author":"JaneAusten","country":"UnitedKingdom","imageLink":"images/pride-and-prejudice.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n","pages":226,"title":"PrideandPrejudice","year":1813},{"author":"Honor\u00e9deBalzac","country":"France","imageLink":"images/le-pere-goriot.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Gor
iot\n","pages":443,"title":"LeP\u00e8reGoriot","year":1835},{"author":"SamuelBeckett","country":"RepublicofIreland","imageLink":"images/molloy-malone-dies-the-unnamable.jpg","language":"French,English","link":"https://en.wikipedia.org/wiki/Molloy_(novel)\n","pages":256,"title":"Molloy,MaloneDies,TheUnnamable,thetrilogy","year":1952},{"author":"GiovanniBoccaccio","country":"Italy","imageLink":"images/the-decameron.jpg","language":"Italian","link":"https://en.wikipedia.org/wiki/The_Decameron\n","pages":1024,"title":"TheDecameron","year":1351},{"author":"JorgeLuisBorges","country":"Argentina","imageLink":"images/ficciones.jpg","language":"Spanish","link":"https://en.wikipedia.org/wiki/Ficciones\n","pages":224,"title":"Ficciones","year":1965},{"author":"EmilyBront\u00eb","country":"UnitedKingdom","imageLink":"images/wuthering-heights.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Wuthering_Heights\n","pages":342,"title":"WutheringHeights","year":1847},{"author":"AlbertCamus","country":"Algeria,FrenchEmpire","imageLink":"images/l-etranger.jpg","language":"French","link":"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n","pages":185,"title":"TheStranger","year":1942},{"author":"PaulCelan","country":"Romania,France","imageLink":"images/poems-paul-celan.jpg","language":"German","link":"\n","pages":320,"title":"Poems","year":1952},{"author":"Louis-FerdinandC\u00e9line","country":"France","imageLink":"images/voyage-au-bout-de-la-nuit.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n","pages":505,"title":"JourneytotheEndoftheNight","year":1932},{"author":"MigueldeCervantes","country":"Spain","imageLink":"images/don-quijote-de-la-mancha.jpg","language":"Spanish","link":"https://en.wikipedia.org/wiki/Don_Quixote\n","pages":1056,"title":"DonQuijoteDeLaMancha","year":1610},{"author":"GeoffreyChaucer","country":"England","imageLink":"images/the-canterbury-tales.jpg","language":"English","link":"https://en.wikipedia
.org/wiki/The_Canterbury_Tales\n","pages":544,"title":"TheCanterburyTales","year":1450},{"author":"AntonChekhov","country":"Russia","imageLink":"images/stories-of-anton-chekhov.jpg","language":"Russian","link":"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n","pages":194,"title":"Stories","year":1886},{"author":"JosephConrad","country":"UnitedKingdom","imageLink":"images/nostromo.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Nostromo\n","pages":320,"title":"Nostromo","year":1904},{"author":"CharlesDickens","country":"UnitedKingdom","imageLink":"images/great-expectations.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Great_Expectations\n","pages":194,"title":"GreatExpectations","year":1861},{"author":"DenisDiderot","country":"France","imageLink":"images/jacques-the-fatalist.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Jacques_the_Fatalis
... (truncated)
CSV
chars: 14,071 tokens: 6,151 chars_og/tok: 4.5 enc_chars/tok: 2.3
<s>author,country,imageLink,language,link,pages,title,year
ChinuaAchebe,Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart
",209,ThingsFallApart,1958
HansChristianAndersen,Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.
",784,Fairytales,1836
DanteAlighieri,Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy
",928,TheDivineComedy,1315
Unknown,SumerandAkkadianEmpire,images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
",160,TheEpicOfGilgamesh,-1700
Unknown,AchaemenidEmpire,images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job
",176,TheBookOfJob,-600
Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
",288,OneThousandandOneNights,1200
Unknown,Iceland,images/njals-saga.jpg,OldNorse,"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
",384,Njál'sSaga,1350
JaneAusten,UnitedKingdom,images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice
",226,PrideandPrejudice,1813
HonorédeBalzac,France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
",443,LePèreGoriot,1835
SamuelBeckett,RepublicofIreland,images/molloy-malone-dies-the-unnamable.jpg,"French,English","https://en.wikipedia.org/wiki/Molloy_(novel)
",256,"Molloy,MaloneDies,TheUnnamable,thetrilogy",1952
GiovanniBoccaccio,Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron
",1024,TheDecameron,1351
JorgeLuisBorges,Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones
",224,Ficciones,1965
... (truncated)
TSV
chars: 14,057 tokens: 6,360 chars_og/tok: 4.4 enc_chars/tok: 2.2
<s>authorcountryimageLinklanguagelinkpagestitleyear
ChinuaAchebeNigeriaimages/things-fall-apart.jpgEnglish"https://en.wikipedia.org/wiki/Things_Fall_Apart
"209ThingsFallApart1958
HansChristianAndersenDenmarkimages/fairy-tales.jpgDanish"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.
"784Fairytales1836
DanteAlighieriItalyimages/the-divine-comedy.jpgItalian"https://en.wikipedia.org/wiki/Divine_Comedy
"928TheDivineComedy1315
UnknownSumerandAkkadianEmpireimages/the-epic-of-gilgamesh.jpgAkkadian"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
"160TheEpicOfGilgamesh-1700
UnknownAchaemenidEmpireimages/the-book-of-job.jpgHebrew"https://en.wikipedia.org/wiki/Book_of_Job
"176TheBookOfJob-600
UnknownIndia/Iran/Iraq/Egypt/Tajikistanimages/one-thousand-and-one-nights.jpgArabic"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
"288OneThousandandOneNights1200
UnknownIcelandimages/njals-saga.jpgOldNorse"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
"384Njál'sSaga1350
JaneAustenUnitedKingdomimages/pride-and-prejudice.jpgEnglish"https://en.wikipedia.org/wiki/Pride_and_Prejudice
"226PrideandPrejudice1813
HonorédeBalzacFranceimages/le-pere-goriot.jpgFrench"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
"443LePèreGoriot1835
SamuelBeckettRepublicofIrelandimages/molloy-malone-dies-the-unnamable.jpgFrench,English"https://en.wikipedia.org/wiki/Molloy_(novel)
"256Molloy,MaloneDies,TheUnnamable,thetrilogy1952
GiovanniBoccaccioItalyimages/the-decameron.jpgItalian"https://en.wikipedia.org/wiki/The_Decameron
"1024TheDecameron1351
JorgeLuisBorgesArgentinaimages/ficciones.jpgSpanish"https://en.wikipedia.org/wiki/Ficciones
"224Ficciones1965
... (truncated)
YAML
chars: 22,400 tokens: 8,859 chars_og/tok: 3.1 enc_chars/tok: 2.5
<s>-author:ChinuaAchebe
country:Nigeria
imageLink:images/things-fall-apart.jpg
language:English
link:'https://en.wikipedia.org/wiki/Things_Fall_Apart

··'
pages:209
title:ThingsFallApart
year:1958
-author:HansChristianAndersen
country:Denmark
imageLink:images/fairy-tales.jpg
language:Danish
link:'https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.

··'
pages:784
title:Fairytales
year:1836
-author:DanteAlighieri
country:Italy
imageLink:images/the-divine-comedy.jpg
language:Italian
link:'https://en.wikipedia.org/wiki/Divine_Comedy
... (truncated)
TOON
chars: 14,277 tokens: 6,172 chars_og/tok: 4.5 enc_chars/tok: 2.3
<s>[100]{author,country,imageLink,language,link,pages,title,year}:
ChinuaAchebe,Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart\n",209,ThingsFallApart,1958
HansChristianAndersen,Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",784,Fairytales,1836
DanteAlighieri,Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy\n",928,TheDivineComedy,1315
Unknown,SumerandAkkadianEmpire,images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n",160,TheEpicOfGilgamesh,-1700
Unknown,AchaemenidEmpire,images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job\n",176,TheBookOfJob,-600
Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n",288,OneThousandandOneNights,1200
Unknown,Iceland,images/njals-saga.jpg,OldNorse,"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n",384,Njál'sSaga,1350
JaneAusten,UnitedKingdom,images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n",226,PrideandPrejudice,1813
HonorédeBalzac,France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n",443,LePèreGoriot,1835
SamuelBeckett,RepublicofIreland,images/molloy-malone-dies-the-unnamable.jpg,"French,English","https://en.wikipedia.org/wiki/Molloy_(novel)\n",256,"Molloy,MaloneDies,TheUnnamable,thetrilogy",1952
GiovanniBoccaccio,Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron\n",1024,TheDecameron,1351
JorgeLuisBorges,Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones\n",224,Ficciones,1965
EmilyBrontë,UnitedKingdom,images/wuthering-heights.jpg,English,"https://en.wikipedia.org/wiki/Wuthering_Heights\n",342,WutheringHeights,1847
AlbertCamus,"Algeria,FrenchEmpire",images/l-etranger.jpg,French,"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n",185,TheStranger,1942
PaulCelan,"Romania,France",images/poems-paul-celan.jpg,German,"\n",320,Poems,1952
Louis-FerdinandCéline,France,images/voyage-au-bout-de-la-nuit.jpg,French,"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n",505,JourneytotheEndoftheNight,1932
MigueldeCervantes,Spain,images/don-quijote-de-la-mancha.jpg,Spanish,"https://en.wikipedia.org/wiki/Don_Quixote\n",1056,DonQuijoteDeLaMancha,1610
GeoffreyChaucer,England,images/the-canterbury-tales.jpg,English,"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n",544,TheCanterburyTales,1450
AntonChekhov,Russia,images/stories-of-anton-chekhov.jpg,Russian,"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n",194,Stories,1886
JosephConrad,UnitedKingdom,images/nostromo.jpg,English,"https://en.wikipedia.org/wiki/Nostromo\n",320,Nostromo,1904
CharlesDickens,UnitedKingdom,images/great-expectations.jpg,English,"https://en.wikipedia.org/wiki/Great_Expectations\n",194,GreatExpectations,1861
DenisDiderot,France,images/jacques-the-fatalist.jpg,French,"https://en.wikipedia.org/wiki/Jacques_the_Fatalist\n",596,JacquestheFatalist,1796
AlfredDöblin,Germany,images/berlin-alexanderplatz.jpg,German,"https://en.wikipedia.org/wiki/Berlin_Alexanderplatz\n",600,BerlinAlexanderplatz,1929
FyodorDostoevsky,Russia,images/crime-and-punishment.jpg,Russian,"https://en.wikipedia.org/wiki/Crime_and_Punishment\n",551,CrimeandPunishment,1866
... (truncated)
TSON
chars: 14,448 tokens: 6,229 chars_og/tok: 4.5 enc_chars/tok: 2.3
<s>{@author,country,imageLink,language,link,pages,title,year#100|"ChinuaAchebe",Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart\n",209,"ThingsFallApart",1958|"HansChristianAndersen",Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",784,"Fairytales",1836|"DanteAlighieri",Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy\n",928,"TheDivineComedy",1315|Unknown,"SumerandAkkadianEmpire",images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n",160,"TheEpicOfGilgamesh",-1700|Unknown,"AchaemenidEmpire",images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job\n",176,"TheBookOfJob",-600|Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n",288,"OneThousandandOneNights",1200|Unknown,Iceland,images/njals-saga.jpg,"OldNorse","https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n",384,"Njál'sSaga",1350|"JaneAusten","UnitedKingdom",images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n",226,"PrideandPrejudice",1813|"HonorédeBalzac",France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n",443,"LePèreGoriot",1835|"SamuelBeckett","RepublicofIreland",images/molloy-malone-dies-the-unnamable.jpg,"French,English","https://en.wikipedia.org/wiki/Molloy_(novel)\n",256,"Molloy,MaloneDies,TheUnnamable,thetrilogy",1952|"GiovanniBoccaccio",Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron\n",1024,"TheDecameron",1351|"JorgeLuisBorges",Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones\n",224,Ficciones,1965|"EmilyBrontë","UnitedKingdom",images/wuthering-heights.jpg,English,"https://en.wikipedia.org/wiki/Wuthering_Heights\n",342,"WutheringHeights",1847|"AlbertCamus","A
lgeria,FrenchEmpire",images/l-etranger.jpg,French,"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n",185,"TheStranger",1942|"PaulCelan","Romania,France",images/poems-paul-celan.jpg,German,"\n",320,Poems,1952|"Louis-FerdinandCéline",France,images/voyage-au-bout-de-la-nuit.jpg,French,"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n",505,"JourneytotheEndoftheNight",1932|"MigueldeCervantes",Spain,images/don-quijote-de-la-mancha.jpg,Spanish,"https://en.wikipedia.org/wiki/Don_Quixote\n",1056,"DonQuijoteDeLaMancha",1610|"GeoffreyChaucer",England,images/the-canterbury-tales.jpg,English,"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n",544,"TheCanterburyTales",1450|"AntonChekhov",Russia,images/stories-of-anton-chekhov.jpg,Russian,"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n",194,Stories,1886|"JosephConrad","UnitedKingdom",images/nostromo.jpg,English,"https://en.wikipedia.org/wiki/Nostromo\n",320,Nostromo,1904|"CharlesDickens","UnitedKingdom",images/great-expectations.jpg,English,"https://en.wikipedia.org/wiki/Great_Expectations\n",194,"GreatExpectations",1861|"DenisDiderot",France,images/jacques-the-fatalist.jpg,French,"https://en.wikipedia.org/wiki/Jacques_the_Fatalist\n",596,"JacquestheFatalist",1796|"AlfredDöblin",Germany,images/berlin-alexanderplatz.jpg,German,"https://en.wikipedia.org/wiki/Berlin_Alexanderplatz\n",600,"BerlinAlexanderplatz",1929|"FyodorDostoevsky",Russia,images/crime-and-punishment.jpg,Russian,"https://en.wikipedia.org/wiki/Crime_and_Punishment\n",551,"CrimeandPunishment",1866|"FyodorDostoevsky",Russia,images/the-idiot.jpg,Russian,"https://en.wikipedia.org/wiki/The_Idiot\n",656,"TheIdiot",1869|"FyodorDostoevsky",Russia,images/the-possessed.jpg,Russian,"https://en.wikipedia.org/wiki/Demons_(Dostoyevsky_novel)\n",768,"ThePossessed",1872|"FyodorDostoevsky",Russia,images/the-brothers-karamazov.jpg,Russian,"https://en.wikipedia.org/wiki/The_Brothers_Karamazov\n",824,"TheBrothersKaramazov",1880|"GeorgeEliot"
,"UnitedKingdom",images/middlemarch.jpg,English,"https://en.wikipedia.org/wiki/Middlemarch\n",800,Middlemarch,1871|"RalphEllison","UnitedStates",images/invisible-man.jpg,English,"https://en.wikipedia.org/wiki/Invisible_Man\n",581,"InvisibleMan",1952|Euripides,Greece,images/medea.jpg,Greek,"https://en.wikipedia.org/wiki/Medea_(play)\n",104,Medea,-431|"WilliamFaulkner","UnitedStates",images/absalom-absalom.jpg,English,"https://en.wikipedia.org/wiki/Absalom,_Absalom!\n",313,"Absalom,Absalom!",1936|"WilliamFaulkner","UnitedStates",images/the-sound-and-the-fury.jpg,English,"https://en.wikipedia.org/wiki/The_Sound_and_the_Fury\n",326,"TheSoundandtheFury",1929|"GustaveFlaubert",France,images/madame-bovary.jpg,French,"https://en.wikipedia.org/wiki/Madame_Bovary\n",528,"MadameBovary",1857|"GustaveFlaubert",France,images/l-education-sentimentale.jpg,French,"https://en.wikipedia.org/wiki/Sen
... (truncated)
minemizer
chars: 14,458 tokens: 6,042 chars_og/tok: 4.6 enc_chars/tok: 2.4
<s>author;country;imageLink;language;link;pages;title;year
ChinuaAchebe;Nigeria;images/things-fall-apart.jpg;English;https://en.wikipedia.org/wiki/Things_Fall_Apart
;209;ThingsFallApart;1958
HansChristianAndersen;Denmark;images/fairy-tales.jpg;Danish;https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.
;784;Fairytales;1836
DanteAlighieri;Italy;images/the-divine-comedy.jpg;Italian;https://en.wikipedia.org/wiki/Divine_Comedy
;928;TheDivineComedy;1315
Unknown;SumerandAkkadianEmpire;images/the-epic-of-gilgamesh.jpg;Akkadian;https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
;160;TheEpicOfGilgamesh;-1700
Unknown;AchaemenidEmpire;images/the-book-of-job.jpg;Hebrew;https://en.wikipedia.org/wiki/Book_of_Job
;176;TheBookOfJob;-600
Unknown;India/Iran/Iraq/Egypt/Tajikistan;images/one-thousand-and-one-nights.jpg;Arabic;https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
;288;OneThousandandOneNights;1200
Unknown;Iceland;images/njals-saga.jpg;OldNorse;https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
;384;Njál'sSaga;1350
JaneAusten;UnitedKingdom;images/pride-and-prejudice.jpg;English;https://en.wikipedia.org/wiki/Pride_and_Prejudice
;226;PrideandPrejudice;1813
HonorédeBalzac;France;images/le-pere-goriot.jpg;French;https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
;443;LePèreGoriot;1835
SamuelBeckett;RepublicofIreland;images/molloy-malone-dies-the-unnamable.jpg;French,English;https://en.wikipedia.org/wiki/Molloy_(novel)
;256;Molloy,MaloneDies,TheUnnamable,thetrilogy;1952
GiovanniBoccaccio;Italy;images/the-decameron.jpg;Italian;https://en.wikipedia.org/wiki/The_Decameron
;1024;TheDecameron;1351
JorgeLuisBorges;Argentina;images/ficciones.jpg;Spanish;https://en.wikipedia.org/wiki/Ficciones
;224;Ficciones;1965
... (truncated)
minemizer (compact)
chars: 13,753 tokens: 6,056 chars_og/tok: 4.6 enc_chars/tok: 2.3
<s>author;country;imageLink;language;link;pages;title;year
ChinuaAchebe;Nigeria;images/things-fall-apart.jpg;English;https://en.wikipedia.org/wiki/Things_Fall_Apart
;209;ThingsFallApart;1958
HansChristianAndersen;Denmark;images/fairy-tales.jpg;Danish;https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.
;784;Fairytales;1836
DanteAlighieri;Italy;images/the-divine-comedy.jpg;Italian;https://en.wikipedia.org/wiki/Divine_Comedy
;928;TheDivineComedy;1315
Unknown;SumerandAkkadianEmpire;images/the-epic-of-gilgamesh.jpg;Akkadian;https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
;160;TheEpicOfGilgamesh;-1700
Unknown;AchaemenidEmpire;images/the-book-of-job.jpg;Hebrew;https://en.wikipedia.org/wiki/Book_of_Job
;176;TheBookOfJob;-600
Unknown;India/Iran/Iraq/Egypt/Tajikistan;images/one-thousand-and-one-nights.jpg;Arabic;https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
;288;OneThousandandOneNights;1200
Unknown;Iceland;images/njals-saga.jpg;OldNorse;https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
;384;Njál'sSaga;1350
JaneAusten;UnitedKingdom;images/pride-and-prejudice.jpg;English;https://en.wikipedia.org/wiki/Pride_and_Prejudice
;226;PrideandPrejudice;1813
HonorédeBalzac;France;images/le-pere-goriot.jpg;French;https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
;443;LePèreGoriot;1835
SamuelBeckett;RepublicofIreland;images/molloy-malone-dies-the-unnamable.jpg;French,English;https://en.wikipedia.org/wiki/Molloy_(novel)
;256;Molloy,MaloneDies,TheUnnamable,thetrilogy;1952
GiovanniBoccaccio;Italy;images/the-decameron.jpg;Italian;https://en.wikipedia.org/wiki/The_Decameron
;1024;TheDecameron;1351
JorgeLuisBorges;Argentina;images/ficciones.jpg;Spanish;https://en.wikipedia.org/wiki/Ficciones
;224;Ficciones;1965
... (truncated)
countries.json — Original: 1133948 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)1,133,948565,8802.02.0
JSON (min)787,962425,6602.71.9
CSVN/A
TSVN/A
YAML641,939251,6104.52.6
TOON691,140246,3604.62.8
TSON423,383196,4995.82.2
minemizer323,130152,3697.42.1
minemizer (compact)299,485156,3547.31.9
JSON (pretty)
chars: 1,133,948 tokens: 565,880 chars_og/tok: 2.0 enc_chars/tok: 2.0
<s>[
{
··"name":{
····"common":"Aruba",
····"official":"Aruba",
····"native":{
······"nld":{
········"official":"Aruba",
········"common":"Aruba"
······},
······"pap":{
········"official":"Aruba",
········"common":"Aruba"
······}
····}
··},
··"tld":[
····".aw"
··],
··"cca2":"AW",
··"ccn3":"533",
··"cca3":"ABW",
··"cioc":"ARU",
··"independent":false,
··"status":"officially-assigned",
... (truncated)
JSON (min)
chars: 787,962 tokens: 425,660 chars_og/tok: 2.7 enc_chars/tok: 1.9
<s>[{"name":{"common":"Aruba","official":"Aruba","native":{"nld":{"official":"Aruba","common":"Aruba"},"pap":{"official":"Aruba","common":"Aruba"}}},"tld":[".aw"],"cca2":"AW","ccn3":"533","cca3":"ABW","cioc":"ARU","independent":false,"status":"officially-assigned","unMember":false,"unRegionalGroup":"","currencies":{"AWG":{"name":"Arubanflorin","symbol":"\u0192"}},"idd":{"root":"+2","suffixes":["97"]},"capital":["Oranjestad"],"altSpellings":["AW"],"region":"Americas","subregion":"Caribbean","languages":{"nld":"Dutch","pap":"Papiamento"},"translations":{"ara":{"official":"\u0623\u0631\u0648\u0628\u0627","common":"\u0623\u0631\u0648\u0628\u0627"},"bre":{"official":"Aruba","common":"Aruba"},"ces":{"official":"Aruba","common":"Aruba"},"deu":{"official":"Aruba","common":"Aruba"},"est":{"official":"Aruba","common":"Aruba"},"fin":{"official":"Aruba","common":"Aruba"},"fra":{"official":"Aruba","common":"Aruba"},"hrv":{"official":"Aruba","common":"Aruba"},"hun":{"official":"Aruba","common":"Aruba"},"ita":{"official":"Aruba","common":"Aruba"},"jpn":{"official":"\u30a2\u30eb\u30d0","common":"\u30a2\u30eb\u30d0"},"kor":{"official":"\uc544\ub8e8\ubc14","common":"\uc544\ub8e8\ubc14"},"nld":{"official":"Aruba","common":"Aruba"},"per":{"official":"\u0622\u0631\u0648\u0628\u0627","common":"\u0622\u0631\u0648\u0628\u0627"},"pol":{"official":"Aruba","common":"Aruba"},"por":{"official":"Aruba","common":"Aruba"},"rus":{"official":"\u0410\u0440\u0443\u0431\u0430","common":"\u0410\u0440\u0443\u0431\u0430"},"slk":{"official":"Aruba","common":"Aruba"},"spa":{"official":"Aruba","common":"Aruba"},"srp":{"official":"Aruba","common":"Aruba"},"swe":{"official":"Aruba","common":"Aruba"},"tur":{"official":"Aruba","common":"Aruba"},"urd":{"official":"\u0627\u0631\u0648\u0628\u0627","common":"\u0627\u0631\u0648\u0628\u0627"},"zho":{"official":"\u963f\u9c81\u5df4","common":"\u963f\u9c81\u5df4"}},"latlng":[12.5,-69.96666666],"landlocked":false,"borders":[],"area":180,"flag":"\ud83c\udde6\ud83c\uddfc","
demonyms":{"eng":{"f":"Aruban","m":"Aruban"},"fra":{"f":"Arubaise","m":"Arubais"}}},{"name":{"common":"Afghanistan","official":"IslamicRepublicofAfghanistan","native":{"prs":{"official":"\u062c\u0645\u0647\u0648\u0631\u06cc\u0627\u0633\u0644\u0627\u0645\u06cc\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"pus":{"official":"\u062f\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646\u0627\u0633\u0644\u0627\u0645\u064a\u062c\u0645\u0647\u0648\u0631\u06cc\u062a","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"tuk":{"official":"OwganystanYslamRespublikasy","common":"Owganystan"}}},"tld":[".af"],"cca2":"AF","ccn3":"004","cca3":"AFG","cioc":"AFG","independent":true,"status":"officially-assigned","unMember":true,"unRegionalGroup":"AsiaandthePacificGroup","currencies":{"AFN":{"name":"Afghanafghani","symbol":"\u060b"}},"idd":{"root":"+9","suffixes":["3"]},"capital":["Kabul"],"altSpellings":["AF","Af\u0121\u0101nist\u0101n"],"region":"Asia","subregion":"SouthernAsia","languages":{"prs":"Dari","pus":"Pashto","tuk":"Turkmen"},"translations":{"ara":{"official":"\u062c\u0645\u0647\u0648\u0631\u064a\u0629\u0623\u0641\u0641\u0627\u0646\u0633\u062a\u0627\u0646\u0627\u0644\u0625\u0633\u0644\u0627\u0645\u064a\u0629","common":"\u0623\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"bre":{"official":"RepublikIslamekAfghanistan","common":"Afghanistan"},"ces":{"official":"Afgh\u00e1nsk\u00e1isl\u00e1msk\u00e1republika","common":"Afgh\u00e1nist\u00e1n"},"deu":{"official":"IslamischeRepublikAfghanistan","common":"Afghanistan"},"est":{"official":"AfganistaniIslamivabariik","common":"Afganistan"},"fin":{"official":"Afganistaninislamilainentasavalta","common":"Afganistan"},"fra":{"official":"R\u00e9publiqueislamiqued'Afghanistan","common":"Afghanistan"},"hrv":{"official":"IslamskaRepublikaAfganistan","common":"Afganistan"},"hun":{"official":"Afganiszt\u00e1niIszl\u00e1mK\u00f6zt\u00e1rsas\u00e1g"
,"common":"Afganiszt\u00e1n"},"ita":{"official":"Repubblicaislamicadell'Afghanistan","common":"Afghanistan"},"jpn":{"official":"\u30a2\u30d5\u30ac\u30cb\u30b9\u30bf\u30f3\u30fb\u30a4\u30b9\u30e9\u30e0\u5171\u548c\u56fd","common":"\u30a2\u30d5\u30ac\u30cb\u30b9\u30bf\u30f3"},"kor":{"official":"\uc544\ud504\uac00\ub2c8\uc2a4\ud0c4\uc774\uc2ac\ub78c\uacf5\ud654\uad6d","common":"\uc544\ud504\uac00\ub2c8\uc2a4\ud0c4"},"nld":{"official":"IslamitischeRepubliekAfghanistan","common":"Afghanistan"},"per":{"official":"\u062c\u0645\u0647\u0648\u0631\u06cc\u0627\u0633\u0644\u0627\u0645\u06cc\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"pol":{"official":"IslamskaRepublikaAfganistanu","common":"Afganistan"},"por":{"official":"Rep\u00fablicaIsl\u00e2micadoAfeganist\u00e3o","common":"Afeganist\u00e3o"},"rus":{"official":"\u0418\u0441\u043b\u0430\u043c\u0441\u043a\u0430\u044f\u0420\
... (truncated)
CSV: N/A
TSV: N/A
YAML
chars: 641,939 tokens: 251,610 chars_og/tok: 4.5 enc_chars/tok: 2.6
<s>-altSpellings:
-AW
area:180
borders:[]
capital:
-Oranjestad
cca2:AW
cca3:ABW
ccn3:'533'
cioc:ARU
currencies:
··AWG:
····name:Arubanflorin
····symbol:ƒ
demonyms:
··eng:
····f:Aruban
····m:Aruban
··fra:
····f:Arubaise
····m:Arubais
flag:
idd:
··root:'+2'
··suffixes:
... (truncated)
TOON
chars: 691,140 tokens: 246,360 chars_og/tok: 4.6 enc_chars/tok: 2.8
<s>[250]:
-
··name:
····common:Aruba
····official:Aruba
····native:
······nld:
········official:Aruba
········common:Aruba
······pap:
········official:Aruba
········common:Aruba
··tld[1]:.aw
··cca2:AW
··ccn3:"533"
··cca3:ABW
··cioc:ARU
··independent:false
··status:officially-assigned
··unMember:false
··unRegionalGroup:""
··currencies:
····AWG:
······name:Arubanflorin
······symbol:ƒ
... (truncated)
TSON
chars: 423,383 tokens: 196,499 chars_og/tok: 5.8 enc_chars/tok: 2.2
<s>{@name(@common,official,native),tld,cca2,ccn3,cca3,cioc,independent,status,unMember,unRegionalGroup,currencies,idd(@root,suffixes),capital,altSpellings,region,subregion,languages,translations(@ara,bre,ces,deu,est,fin,fra,hrv,hun,ita,jpn,kor,nld,per,pol,por,rus,slk,spa,srp,swe,tur,urd,zho),latlng,landlocked,borders,area,flag,demonyms(@eng,fra)#250|{Aruba,Aruba,{@nld,pap|{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba}}},[.aw],AW,"533",ABW,ARU,false,officially-assigned,false,"",{@AWG|{@name,symbol|"Arubanflorin",ƒ}},{"+2",["97"]},[Oranjestad],[AW],Americas,Caribbean,{@nld,pap|Dutch,Papiamento},{{@official,common|أروبا,أروبا},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|,},{@official,common|,},{@official,common|Aruba,Aruba},{@official,common|آروبا,آروبا},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Аруба,Аруба},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|اروبا,اروبا},{@official,common|,}},[12.5,-69.96666666],false,[],180,,{{@f,m|Aruban,Aruban},{@f,m|Arubaise,Arubais}}|{Afghanistan,"IslamicRepublicofAfghanistan",{@prs,pus,tuk|{@official,common|"جمهوریاسلامیافغانستان",افغانستان},{@official,common|"دافغانستاناسلاميجمهوریت",افغانستان},{@official,common|"OwganystanYslamRespublikasy",Owganystan}}},[.af],AF,"004",AFG,AFG,true,officially-assigned,true,"AsiaandthePacificGroup",{@AFN|{@name,symbol|"Afghanafghani",}},{"+9",["3"]},[Kabul],[AF,Afġānistān],Asia,"SouthernAsia",{@prs,pus,tuk|Dari,Pashto,Turkmen},{{@official,common|"جمهوريةأففانستانالإسلامية",أفغانستان},{@official,common|"RepublikIslamekAfghanistan",Afghanistan},{@official,common|"Afghánskáislám
skárepublika",Afghánistán},{@official,common|"IslamischeRepublikAfghanistan",Afghanistan},{@official,common|"AfganistaniIslamivabariik",Afganistan},{@official,common|"Afganistaninislamilainentasavalta",Afganistan},{@official,common|"Républiqueislamiqued'Afghanistan",Afghanistan},{@official,common|"IslamskaRepublikaAfganistan",Afganistan},{@official,common|"AfganisztániIszlámztársaság",Afganisztán},{@official,common|"Repubblicaislamicadell'Afghanistan",Afghanistan},{@official,common|,},{@official,common|"",},{@official,common|"IslamitischeRepubliekAfghanistan",Afghanistan},{@official,common|"جمهوریاسلامیافغانستان",افغانستان},{@official,common|"IslamskaRepublikaAfganistanu",Afganistan},{@official,common|"RepúblicaIslâmicadoAfeganistão",Afeganistão},{@official,common|"ИсламскаяРеспубликаАфганистан",Афганистан},{@official,common|"Afgánskyislamskýštát",Afganistan},{@official,common|"RepúblicaIslámicadeAfganistán",Afganistán},{@official,common|"IslamskaRepublikaAvganistan",Avganistan},{@official,common|"IslamiskarepublikenAfghanistan",Afghanistan},{@official,common|"AfganistanİslamCumhuriyeti",Afganistan},{@official,common|"اسلامیجمہوریہافغانستان",افغانستان},{@official,common|,}},[33,65],true,[IRN,PAK,TKM,UZB,TJK,CHN],652230,,{{@f,m|Afghan,Afghan},{@f,m|Afghane,Afghan}}|{Angola,"RepublicofAngola",{@por|{@official,common|"RepúblicadeAngola",Angola}}},[.ao],AO,"024",AGO,ANG,true,officially-assigned,true,"AfricanGroup",{@AOA|{@name,symbol|"Angolankwanza",Kz}},{"+2",["44"]},[Luanda],[AO,"RepúblicadeAngola","ʁɛpublikadean'ɡɔla"],Africa,"MiddleAfrica",{@por|Portuguese},{{@official,common|أنغولا,"جمهوريةأنغولا"},{@official,common|"RepublikAngola",Angola},{@official,common|"Angolskárepublika",Angola},{@official,common|"RepublikAngola",Angola},{@official,common|"AngolaVabariik",Angola},{@official,common|"Angolantasavalta",Angola},{@official,common|"Républiqued'Angola",Angola},{@official,common|"RepublikaAngola",Angola},{@official,common|Angola,Angola},{@official,common|"Repubblica
dell'Angola",Angola},{@official,common|,},{@official,common|"",},{@official,common|"RepubliekAngola",Angola},{@official,common|"جمهوریآنگولا",آنگولا},{@official,common|"RepublikaAngoli",Angola},{@official,common|"RepúblicadeAngola",Angola},{@official,common|"РеспубликаАнгола",Ангола},{@official,common|"Angolskárepublika",Angola},{@official,common|"RepúblicadeAngola",Angola},{@official,common|"RepublikaAngola",Angola},{@official,common|"RepublikenAngola",Angola},{@official,common|"AngolaCumhuriyeti",Angola},{@official,common|"جمہوریہانگولہ",انگولہ},{@official,common|,}},[-12.5,18.5],false,[COG,COD,ZMB,NAM],1246700,,{{@f,m|Angolan,Angolan},{@f,m|Angolaise,Angolais}}|{Anguilla,Anguilla,{@eng|{@official,common|Anguilla,Anguilla}}},[.ai],AI,"660",AIA,"",false,officially-assigned,false,"",{@XCD
... (truncated)
minemizer
chars: 323,130 tokens: 152,369 chars_og/tok: 7.4 enc_chars/tok: 2.1
<s>name{common;official;native{...}};tld[];cca2;ccn3;cca3;cioc;independent;status;unMember;unRegionalGroup;currencies{...};idd{root;suffixes[]};capital[];altSpellings[];region;subregion;languages{...};translations{ara{official;common};bre{official;common};ces{official;common};deu{official;common};est{official;common};fin{official;common};fra{official;common};hrv{official;common};hun{official;common};ita{official;common};jpn{official;common};kor{official;common};nld{official;common};per{official;common};pol{official;common};por{official;common};rus{official;common};slk{official;common};spa{official;common};srp{official;common};swe{official;common};tur{official;common};urd{official;common};zho{official;common}};latlng[];landlocked;borders[];area;flag;demonyms{eng{f;m};fra{f;m}}
{Aruba;Aruba;{nld:{official:Aruba;common:Aruba};pap:{official:Aruba;common:Aruba}}};[.aw];AW;533;ABW;ARU;false;officially-assigned;false;;{AWG:{name:Arubanflorin;symbol:ƒ}};{+2;[97]};[Oranjestad];[AW];Americas;Caribbean;{nld:Dutch;pap:Papiamento};{{أروبا;أروبا};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{;};{;};{Aruba;Aruba};{آروبا;آروبا};{Aruba;Aruba};{Aruba;Aruba};{Аруба;Аруба};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{اروبا;اروبا};{;}};[12.5;-69.96666666];false;[];180;;{{Aruban;Aruban};{Arubaise;Arubais}}
{Afghanistan;IslamicRepublicofAfghanistan;{prs:{official:جمهوریاسلامیافغانستان;common:افغانستان};pus:{official:دافغانستاناسلاميجمهوریت;common:افغانستان};tuk:{official:OwganystanYslamRespublikasy;common:Owganystan}}};[.af];AF;004;AFG;AFG;true;officially-assigned;true;AsiaandthePacificGroup;{AFN:{name:Afghanafghani;symbol:}};{+9;[3]};[Kabul];[AF;Afġānistān];Asia;SouthernAsia;{prs:Dari;pus:Pashto;tuk:Turkmen};{{جمهوريةأففانستانالإسلامية;أفغانستان};{RepublikIslamekAfghanistan;Afghanistan};{Afghánskáislámskárepublika;Afghánistán};{IslamischeRepublikAfghanistan;Afghanistan};{AfganistaniIslamivabariik;Afganistan};{Afganistaninislamilainentasavalta;Afganistan};{Républiqueislamiqued'Afghanistan;Afghanistan};{IslamskaRepublikaAfganistan;Afganistan};{AfganisztániIszlámztársaság;Afganisztán};{Repubblicaislamicadell'Afghanistan;Afghanistan};{;};{;};{IslamitischeRepubliekAfghanistan;Afghanistan};{جمهوریاسلامیافغانستان;افغانستان};{IslamskaRepublikaAfganistanu;Afganistan};{RepúblicaIslâmicadoAfeganistão;Afeganistão};{ИсламскаяРеспубликаАфганистан;Афганистан};{Afgánskyislamskýštát;Afganistan};{RepúblicaIslámicadeAfganistán;Afganistán};{IslamskaRepublikaAvganistan;Avganistan};{IslamiskarepublikenAfghanistan;Afghanistan};{AfganistanİslamCumhuriyeti;Afganistan};{اسلامیجمہوریہافغانستان;افغانستان};{;}};[33;65];true;[IRN;PAK;TKM;UZB;TJK;CHN];652230;;{{Afghan;Afghan};{Afghane;Afghan}}
{Angola;RepublicofAngola;{por:{official:RepúblicadeAngola;common:Angola}}};[.ao];AO;024;AGO;ANG;true;officially-assigned;true;AfricanGroup;{AOA:{name:Angolankwanza;symbol:Kz}};{+2;[44]};[Luanda];[AO;RepúblicadeAngola;ʁɛpublikadean'ɡɔla];Africa;MiddleAfrica;{por:Portuguese};{{أنغولا;جمهوريةأنغولا};{RepublikAngola;Angola};{Angolskárepublika;Angola};{RepublikAngola;Angola};{AngolaVabariik;Angola};{Angolantasavalta;Angola};{Républiqued'Angola;Angola};{RepublikaAngola;Angola};{Angola;Angola};{Repubblicadell'Angola;Angola};{;};{;};{RepubliekAngola;Angola};{جمهوریآنگولا;آنگولا};{RepublikaAngoli;Angola};{RepúblicadeAngola;Angola};{РеспубликаАнгола;Ангола};{Angolskárepublika;Angola};{RepúblicadeAngola;Angola};{RepublikaAngola;Angola};{RepublikenAngola;Angola};{AngolaCumhuriyeti;Angola};{جمہوریہانگولہ;انگولہ};{;}};[-12.5;18.5];false;[COG;COD;ZMB;NAM];1246700;;{{Angolan;Angolan};{Angolaise;Angolais}}
{Anguilla;Anguilla;{eng:{official:Anguilla;common:Anguilla}}};[.ai];AI;660;AIA;;false;officially-assigned;false;;{XCD:{name:EasternCaribbeandollar;symbol:$}};{+1;[264]};[TheValley];[AI];Americas;Caribbean;{eng:English};{{أنغويلا;أنغويلا};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{;};{;};{Anguilla;Anguilla};{آنگویلا;آنگویلا};{Anguilla;Anguilla};{Anguilla;Anguilla};{Ангилья;Ангилья};{Anguilla;Anguilla};{Anguila;Anguilla};{Angvila;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{اینگویلا;اینگویلا};{;}};[18.25;-63.16666666];false;[];91;;{{Anguillian;Anguillian};{Anguillane;Anguillan}}
{ÅlandIslands;ÅlandIslands;{swe:{official:LandskapetÅland;common:Åland}}};[.ax];AX;248;ALA;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+3;[5818]};[Mariehamn];[AX;Aaland;Aland;Ahvenanmaa];Europe;NorthernEurope;{swe:Swedish};{{جزرأولاند;جزرأولاند};{IniziÅland;Åland};{Ålandskéostrovy;Ålandy};{Åland-Inseln;Åland};{Ahvenamaamaakond;Ahvenamaa};{Ahvenanmaanmaakunta;Ahvenanmaa};{Ahvenanmaa;Ahvenanmaa};{AlandIslands;Ålandskiotoci};{Åland-szigetek;Åland-szigetek};{IsoleÅland;IsoleAland};{;};{;};{Ålandeilanden;Ålandeilanden};{جزایرالند;جزایرالند};{WyspyAlandzkie;WyspyAlandzkie};{IlhasÅland;Alândia};{Аландскиеострова;Аландскиеострова};{Alandskéostrovy;Alandy};{IslasÅland;Alandia};{OlandskaOstrva;OlandskaOstrva};{Åland;Åland};{ÅlandAdaları;Åland};{جزائراولند;جزائراولند};{;}};[60.116667;19.9];false;[];1580;;{{Ålandish;Ålandish};{Ålandaise;Ålandais}}
{Albania;RepublicofAlbania;{sqi:{official:RepublikaeShqipërisë;common:Shqipëria}}};[.al];AL;008;ALB;ALB;true;officially-assigned;true;EasternEuropeanGroup;{ALL:{name:Albanianlek;symbol:L}};{+3;[55]};[Tirana];[AL;Shqipëri;Shqipëria;Shqipnia];Europe;SoutheastEurope;{sqi:Albanian};{{جمهوريةألبانيا;ألبانيا};{RepublikAlbania;Albania};{Albánskárepublika;Albánie};{RepublikAlbanien;Albanien};{AlbaaniaVabariik;Albaania};{Albaniantasavalta;Albania};{Républiqued'Albanie;Albanie};{RepublikaAlbanija;Albanija};{Albánztársaság;Albánia};{Repubblicad'Albania;Albania};{;};{;};{RepubliekAlban;Alban};{جمهوریآلبانی;آلبانی};{RepublikaAlbanii;Albania};{RepúblicadaAlbânia;Albânia};{РеспубликаАлбания;Албания};{Albánskarepublika;Albánsko};{RepúblicadeAlbania;Albania};{RepublikaAlbanija;Albanija};{RepublikenAlbanien;Albanien};{ArnavutlukCumhuriyeti;Arnavutluk};{جمہوریہالبانیا;البانیا};{;}};[41;20];false;[MNE;GRC;MKD;UNK];28748;;{{Albanian;Albanian};{Albanaise;Albanais}}
{Andorra;PrincipalityofAndorra;{cat:{official:Principatd'Andorra;common:Andorra}}};[.ad];AD;020;AND;AND;true;officially-assigned;true;WesternEuropeanandOthersGroup;{EUR:{name:Euro;symbol:}};{+3;[76]};[AndorralaVella];[AD;PrincipalityofAndorra;Principatd'Andorra];Europe;SouthernEurope;{cat:Catalan};{{إمارةأندورا;أندورا};{PriñselezhAndorra;Andorra};{Andorrskéknížect;Andorra};{FürstentumAndorra;Andorra};{AndorraVürstiriik;Andorra};{Andorranruhtinaskunta;Andorra};{Principautéd'Andorre;Andorre};{KneževinaAndora;Andora};{Andorra;Andorra};{PrincipatodiAndorra;Andorra};{;};{;};{PrinsdomAndorra;Andorra};{شاهزادهنشینآندورا;آندورا};{KsięstwoAndory;Andora};{PrincipadodeAndorra;Andorra};{КняжествоАндорра;Андорра};{Andorrskékniežatstvo;Andorra};{PrincipadodeAndorra;Andorra};{KneževinaAndora;Andora};{FurstendömetAndorra;Andorra};{AndorraPrensliği;Andorra};{اماراتِانورا;انورا};{;}};[42.5;1.5];true;[FRA;ESP];468;;{{Andorran;Andorran};{Andorrane;Andorran}}
{UnitedArabEmirates;UnitedArabEmirates;{ara:{official:الإماراتالعربيةالمتحدة;common:الإمارات}}};[.ae;امارات.];AE;784;ARE;UAE;true;officially-assigned;true;AsiaandthePacificGroup;{AED:{name:UnitedArabEmiratesdirham;symbol:د.إ}};{+9;[71]};[AbuDhabi];[AE;UAE;Emirates];Asia;WesternAsia;{ara:Arabic};{{الإماراتالعربيةالمتحدة;الإمارات};{EmirelezhioùArabUnanet;EmirelezhioùArabUnanet};{Spojenéarabskéemiráty;Spojenéarabskéemiráty};{VereinigteArabischeEmirate;VereinigteArabischeEmirate};{AraabiaÜhendemiraadid;AraabiaÜhendemiraadid};{Yhdistyneetarabiemiirikunnat;Arabiemiraatit};{Émiratsarabesunis;Émiratsarabesunis};{UjedinjeniArapskiEmirati;UjedinjeniArapskiEmirati};{EgyesültArabEmírségek;EgyesültArabEmírségek};{EmiratiArabiUniti;EmiratiArabiUniti};{;UAE};{;};{VerenigdeArabischeEmiraten;VerenigdeArabischeEmiraten};{اماراتمتحدهعربی;امارات};{ZjednoczoneEmiratyArabskie;ZjednoczoneEmiratyArabskie};{EmiradosÁrabesUnidos;EmiradosÁrabesUnidos};{ОбъединенныеАрабскиеЭмираты;ОбъединённыеАрабскиеЭмираты};{Spojenéarabskéemiráty;Spojenéarabskéemiráty};{EmiratosÁrabesUnidos;EmiratosÁrabesUnidos};{UjedinjeniArapskiEmirati;UjedinjeniArapskiEmirati};{FörenadeArabemiraten;FörenadeArabemiraten};{BirleşikArapEmirlikleri;BirleşikArapEmirlikleri};{متحدہعربامارات;متحدہعربامارات};{;}};[24;54];false;[OMN;SAU];83600;;{{Emirati;Emirati};{Emirienne;Emirien}}
{Argentina;ArgentineRepublic;{grn:{official:ArgentineRepublic;common:Argentina};spa:{official:RepúblicaArgentina;common:Argentina}}};[.ar];AR;032;ARG;ARG;true;officially-assigned;true;LatinAmericanandCaribbeanGroup;{ARS:{name:Argentinepeso;symbol:$}};{+5;[4]};[BuenosAires];[AR;ArgentineRepublic;RepúblicaArgentina];Americas;SouthAmerica;{grn:Guaraní;spa:Spanish};{{جمهوريةالأرجنتين;الأرجنتين};{RepublikArc'hantina;Arc'hantina};{Argentinskárepublika;Argentina};{ArgentinischeRepublik;Argentinien};{ArgentinaVabariik;Argentina};{Argentiinantasavalta;Argentiina};{Républiqueargentine;Argentine};{ArgentinskiRepublika;Argentina};{Argentinztársaság;Argentína};{RepubblicaArgentina;Argentina};{;};{;};{ArgentijnseRepubliek;Argentinië};{جمهوریآرانتین;آرانتین};{RepublikaArgentyńska;Argentyna};{RepúblicaArgentina;Argentina};{АргентинскаяРеспублика;Аргентина};{Argentínskarepublika;Argentína};{RepúblicaArgentina;Argentina};{RepublikaArgentina;Argentina};{RepublikenArgentina;Argentina};{ArjantinCumhuriyeti;Arjantin};{جمہوریہارجنائن;ارجنائن};{;}};[-34;-64];false;[BOL;BRA;CHL;PRY;URY];2780400;;{{Argentine;Argentine};{Argentine;Argentin}}
{Armenia;RepublicofArmenia;{hye:{official:ՀայաստանիՀանրապետություն;common:Հայաստան}}};[.am];AM;051;ARM;ARM;true;officially-assigned;true;EasternEuropeanGroup;{AMD:{name:Armeniandram;symbol:}};{+3;[74]};[Yerevan];[AM;Hayastan;RepublicofArmenia;ՀայաստանիՀանրապետություն];Asia;WesternAsia;{hye:Armenian};{{جمهوريةأرمينيا;أرمينيا};{RepublikArmenia;Armenia};{Arménskárepublika;Arménie};{RepublikArmenien;Armenien};{ArmeeniaVabariik;Armeenia};{Armeniantasavalta;Armenia};{Républiqued'Arménie;Arménie};{RepublikaArmenija;Armenija};{Örményország;Örményország};{RepubblicadiArmenia;Armenia};{;};{;};{RepubliekArmen;Armen};{جمهوریارمنستان;ارمنستان};{RepublikaArmenii;Armenia};{RepúblicadaArménia;Arménia};{РеспубликаАрмения;Армения};{Arménskarepublika;Arménsko};{RepúblicadeArmenia;Armenia};{RepublikaJermenija;Jermenija};{RepublikenArmenien;Armenien};{ErmenistanCumhuriyeti;Ermenistan};{جمہوریہآرمینیا;آرمینیا};{;}};[40;45];true;[AZE;GEO;IRN;TUR];29743;;{{Armenian;Armenian};{Arménienne;Arménien}}
{AmericanSamoa;AmericanSamoa;{eng:{official:AmericanSamoa;common:AmericanSamoa};smo:{official:SāmoaAmelika;common:SāmoaAmelika}}};[.as];AS;016;ASM;ASA;false;officially-assigned;false;;{USD:{name:UnitedStatesdollar;symbol:$}};{+1;[684]};[PagoPago];[AS;AmerikaSāmoa;AmelikaSāmoa;SāmoaAmelika];Oceania;Polynesia;{eng:English;smo:Samoan};{{سامواالأمريكية;سامواالأمريكية};{SamoaAmerikan;SamoaAmerikan};{AmerickáSamoa;AmerickáSamoa};{Amerikanisch-Samoa;Amerikanisch-Samoa};{AmeerikaSamoa;AmeerikaSamoa};{AmerikanSamoa;AmerikanSamoa};{Samoaaméricaines;Samoaaméricaines};{amerkaSamoa;AmerkaSamoa};{Szamoa;Szamoa};{Samoaamericane;SamoaAmericane};{;};{;};{AmerikaansSamoa;AmerikaansSamoa};{ساموآیآمریکا;ساموآیآمریکا};{SamoaAmerykańskie;SamoaAmerykańskie};{Samoaamericana;SamoaAmericana};{американскоеСамоа;АмериканскоеСамоа};{AmerickáSamoa;AmerickáSamoa};{SamoaAmericana;SamoaAmericana};{AmerkaSamoa;AmerkaSamoa};{AmerikanskaSamoa;AmerikanskaSamoa};{AmerikanSamoası;AmerikanSamoası};{امریکیسمووا;امریکیسمووا};{;}};[-14.33333333;-170];false;[];199;;{{AmericanSamoan;AmericanSamoan};{Samoane;Samoan}}
{Antarctica;Antarctica;{}};[.aq];AQ;010;ATA;;false;officially-assigned;false;;{};{;[]};[];[AQ];Antarctic;;{};{{أنتارتيكا;أنتارتيكا};{Antarktika;Antarktika};{Antarktida;Antarktida};{Antarktika;Antarktis};{Antarktika;Antarktika};{Etelämanner;Etelämanner};{Antarctique;Antarctique};{Antarktika;Antarktika};{Antarktisz;Antarktisz};{Antartide;Antartide};{;};{;};{Antarctica;Antarctica};{جنوبگان;جنوبگان};{Antarktyka;Antarktyka};{Antártica;Antártida};{Антарктида;Антарктида};{Antarktída;Antarktída};{Antártida;Antártida};{Antarktik;Antarktik};{Antarktis;Antarktis};{Antarktika;Antarktika};{انارککا;انارککا};{;}};[-90;0];false;[];14000000;;{{Antarctican;Antarctican};{Antarcticaine;Antarcticain}}
{FrenchSouthernandAntarcticLands;TerritoryoftheFrenchSouthernandAntarcticLands;{fra:{official:TerritoiredesTerresaustralesetantarctiquesfrançaises;common:Terresaustralesetantarctiquesfrançaises}}};[.tf];TF;260;ATF;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+2;[62]};[Port-aux-Français];[TF;FrenchSouthernTerritories];Antarctic;;{fra:French};{{مقاطعاتوأقاليمماوراءالبحارالفرنسية;أراضفرنسيةجنوبيةوأنتارتيكية};{TiriadDouaroùAostralhagAntarktikelFrañs;DouaroùAostralhagAntarktikelFrañs};{TeritoriumFrancouzskájižaantarktickáúzemí;Francouzskájižaantarktickáúzemí};{GebietderFranzösischSüd-undAntarktisgebiete;FranzösischeSüd-undAntarktisgebiete};{PrantsuseLõunaalad;PrantsuseLõunaalad};{Ranskaneteläisetjaantarktisetalueet;Ranskaneteläisetjaantarktisetalueet};{TerritoiredesTerresaustralesetantarctiquesfrançaises;Terresaustralesetantarctiquesfrançaises};{TeritorijuFrancuskijužniiantarktičkiteritoriji;Francuskijužniiantarktičkiteritoriji};{Francialiésantarktisziterületek;Francialiésantarktisziterületek};{TerritoriodellaaustralieantartichefrancesiTerre;TerritoriFrancesidelSud};{;};{;};{GrondgebiedvandeFranseZuidelijkeenAntarctischegebieden;FranseGebiedenindezuidelijkeIndischeOceaan};{سرزمینهایجنوبیوجنوبگانیفرانسه;سرزمینهایجنوبیوجنوبگانیفرانسه};{FrancuskieTerytoriaPołudnioweiAntarktyczne;FrancuskieTerytoriaPołudnioweiAntarktyczne};{TerritóriodoSuleAntárticaFrancesa;TerrasAustraiseAntárticasFrancesas};{ТерриторияФранцузскиеЮжныеиАнтарктическиеземли;ФранцузскиеЮжныеиАнтарктическиетерритории};{Francúzskejužaantarktickéúzemia;FrancúzskejuŽaantarktickéúzemia};{TerritoriodelFrancésTierrasaustralesyantárticas;TierrasAustralesyAntárticasFrancesas};{Francuskejužneiantarktičkezemlje;Francuskejužneiantarktičkezemlje};{Franskasyd-ochAntarktisterritorierna;Franskasödraterritorierna};{FransızneyveAntarktikaToprakları;FransızneyveAntarktikaToprakları};{سرزمینِجنوبیفرانسیسیہوانارکیکہ;سرزمینجنوبیفرانسیسیہوانارکیکا};{;}};[-49.25;69.167];false;[];7747;;{{French;French};{Française;Franç
ais}}
{AntiguaandBarbuda;AntiguaandBarbuda;{eng:{official:AntiguaandBarbuda;common:AntiguaandBarbuda}}};[.ag];AG;028;ATG;ANT;true;officially-assigned;true;LatinAmericanandCaribbeanGroup;{XCD:{name:EasternCaribbeandollar;symbol:$}};{+1;[268]};[SaintJohn's];[AG];Americas;Caribbean;{eng:English};{{أنتيغواوباربودا;أنتيغواوباربودا};{AntiguahaBarbuda;AntiguahaBarbuda};{AntiguaaBarbuda;AntiguaaBarbuda};{AntiguaundBarbuda;AntiguaundBarbuda};{AntiguajaBarbuda;AntiguajaBarbuda};{AntiguajaBarbuda;AntiguajaBarbuda};{Antigua-et-Barbuda;Antigua-et-Barbuda};{AntigvaiBarbuda;AntigvaiBarbuda};{AntiguaésBarbuda;AntiguaésBarbuda};{AntiguaeBarbuda;AntiguaeBarbuda};{;};{;};{AntiguaenBarbuda;AntiguaenBarbuda};{آنتیگواوباربودا;آنتیگواوباربودا};{AntiguaiBarbuda;AntiguaiBarbuda};{AntiguaeBarbuda;AntíguaeBarbuda};{АнтигуаиБарбуда;АнтигуаиБарбуда};{AntiguaaBarbuda;AntiguaaBarbuda};{AntiguayBarbuda;AntiguayBarbuda};{AntigvaiBarbuda;AntigvaiBarbuda};{AntiguaochBarbuda;AntiguaochBarbuda};{AntiguaveBarbuda;AntiguaveBarbuda};{اینیگواوباربوا;اینیگواوباربوا};{;}};[17.05;-61.8];false;[];442;;{{Antiguan,Barbudan;Antiguan,Barbudan};{Antiguaiseetbarbudienne;Antiguaiseetbarbudien}}
{Australia;CommonwealthofAustralia;{eng:{official:CommonwealthofAustralia;common:Australia}}};[.au];AU;036;AUS;AUS;true;officially-assigned;true;WesternEuropeanandOthersGroup;{AUD:{name:Australiandollar;symbol:$}};{+6;[1]};[Canberra];[AU];Oceania;AustraliaandNewZealand;{eng:English};{{كومونولثأستراليا;أستراليا};{KengladAostralia;Aostralia};{Australskéspolečenství;Austrálie};{CommonwealthAustralien;Australien};{AustraaliaÜhendus;Austraalia};{Australianliittovaltio;Australia};{Australie;Australie};{CommonwealthofAustralia;Australija};{AusztrálÁllamszövetség;Ausztrália};{Commonwealthdell'Australia;Australia};{;};{;};{GemenebestvanAustral;Austral};{قلمروهمسوداسترالیا;استرالیا};{ZwiązekAustralijski;Australia};{ComunidadedaAustrália;Austrália};{СодружествоАвстралии;Австралия};{Austrálskyzz;Austrália};{MancomunidaddeAustralia;Australia};{KomonveltAustralija;Australija};{Australiskastatsförbundet;Australien};{AvustralyaFederalDevleti;Avustralya};{دولتِمشترکہآسریلیا;آسریلیا};{;}};[-27;133];false;[];7692024;;{{Australian;Australian};{Australienne;Australien}}
{Austria;RepublicofAustria;{bar:{official:RepublikÖsterreich;common:Österreich}}};[.at];AT;040;AUT;AUT;true;officially-assigned;true;WesternEuropeanandOthersGroup;{EUR:{name:Euro;symbol:}};{+4;[3]};[Vienna];[AT;Osterreich;Oesterreich];Europe;CentralEurope;{bar:Austro-BavarianGerman};{{جمهوريةالنمسا;النمسا};{RepublikAostria;Aostria};{Rakousrepublika;Rakousko};{RepublikÖsterreich;Österreich};{AustriaVabariik;Austria};{Itävallantasavalta;Itävalta};{Républiqued'Autriche;Autriche};{RepublikaAustrija;Austrija};{Ausztria;Ausztria};{Repubblicad'Austria;Austria};{;};{;};{RepubliekOostenrijk;Oostenrijk};{جمهوریاتریش;اتریش};{RepublikaAustrii;Austria};{RepúblicadaÁustria;Áustria};{АвстрийскаяРеспублика;Австрия};{Rakúskarepublika;Rakúsko};{RepúblicadeAustria;Austria};{RepublikaAustrija;Austrija};{RepublikenÖsterrike;Österrike};{AvusturyaCumhuriyeti;Avusturya};{جمہوریہآسریا;آسریا};{;}};[47.33333333;13.33333333];true;[CZE;DEU;HUN;ITA;LIE;SVK;SVN;CHE];83871;;{{Austrian;Austrian};{Autrichienne;Autrichien}}
{Azerbaijan;RepublicofAzerbaijan;{aze:{official:AzərbaycanRespublikası;common:Azərbaycan};rus:{official:АзербайджанскаяРеспублика;common:Азербайджан}}};[.az];AZ;031;AZE;AZE;true;officially-assigned;true;EasternEuropeanGroup;{AZN:{name:Azerbaijanimanat;symbol:}};{+9;[94]};[Baku];[AZ;RepublicofAzerbaijan;AzərbaycanRespublikası];Asia;WesternAsia;{aze:Azerbaijani;rus:Russian};{{جمهوريةأذربيجان;أذربيجان};{RepublikAzerbaidjan;Azerbaidjan};{Ázerbájdžánskárepublika;Ázerbájdžán};{RepublikAserbaidschan;Aserbaidschan};{AserbaidžaaniVabariik;Aserbaidžaan};{Azerbaidzanintasavalta;Azerbaidzan};{Républiqued'Azerbaïdjan;Azerbaïdjan};{RepublikaAzerbajdžan;Azerbajdžan};{Azerbajdzsán;Azerbajdzsán};{Repubblicadell'Azerbaigian;Azerbaijan};{;};{;};{RepubliekAzerbeidzjan;Azerbeidzjan};{جمهوریآذربایجان;جمهوریآذربایجان};{RepublikaAzerbejdżanu;Azerbejdżan};{RepúblicadoAzerbaijão;Azerbeijão};{АзербайджанскаяРеспублика;Азербайджан};{Azerbajanskárepublika;Azerbajan};{RepúblicadeAzerbaiyán;Azerbaiyán};{RepublikaAzerbejdžan;Azerbejdžan};{RepublikenAzerbajdzjan;Azerbajdzjan};{AzerbaycanCumhuriyeti;Azerbaycan};{جمہوریہآذربائیجان;آذربائیجان};{;}};[40.5;47.5];true;[ARM;GEO;IRN;RUS;TUR];86600;;{{Azerbaijani;Azerbaijani};{Azerbaïdjanaise;Azerbaïdjanais}}
{Burundi;RepublicofBurundi;{fra:{official:RépubliqueduBurundi;common:Burundi};run:{official:Republikay'Uburundi;common:Uburundi}}};[.bi];BI;108;BDI;BDI;true;officially-assigned;true;AfricanGroup;{BIF:{name:Burundianfranc;symbol:Fr}};{+2;[57]};[Gitega];[BI;RepublicofBurundi;Republikay'Uburundi;RépubliqueduBurundi];Africa;EasternAfrica;{fra:French;run:Kirundi};{{جمهوريةبوروندي;بوروندي};{RepublikBurundi;Burundi};{Burundskárepublika;Burundi};{RepublikBurundi;Burundi};{BurundiVabariik;Burundi};{Burundintasavalta;Burundi};{RépubliqueduBurundi;Burundi};{Burundi;Burundi};{Burundi;Burundi};{RepubblicadelBurundi;Burundi};{;};{;};{RepubliekBurundi;Burundi};{جمهوریبوروندی;بوروندی};{RepublikaBurundi;Burundi};{RepúblicadoBurundi;Burundi};{РеспубликаБурунди;Бурунди};{Burundskárepublika;Burundi};{RepúblicadeBurundi;Burundi};{RepublikaBurundi;Burundi};{RepublikenBurundi;Burundi};{BurundiCumhuriyeti;Burundi};{جمہوریہبرونی;برونی};{;}};[-3.5;30];true;[COD;RWA;TZA];27834;;{{Burundian;Burundian};{Burundaise;Burundais}}
{Belgium;KingdomofBelgium;{deu:{official:KönigreichBelgien;common:Belgien};fra:{official:RoyaumedeBelgique;common:Belgique};nld:{official:KoninkrijkBelgië;common:België}}};[.be];BE;056;BEL;BEL;true;officially-assigned;true;WesternEuropeanandOthersGroup;{EUR:{name:Euro;symbol:}};{+3;[2]};[Brussels];[BE;België;Belgie;Belgien;Belgique;KingdomofBelgium;KoninkrijkBelgië;RoyaumedeBelgique;KönigreichBelgien];Europe;WesternEurope;{deu:German;fra:French;nld:Dutch};{{مملكةبلجيكا;بلجيكا};{RouantelezhBelgia;Belgia};{Belgickéklovství;Belgie};{KönigreichBelgien;Belgien};{BelgiaKuningriik;Belgia};{Belgiankuningaskunta;Belgia};{RoyaumedeBelgique;Belgique};{KraljevinaBelgija;Belgija};{BelgaKirályság;Belgium};{RegnodelBelgio;Belgio};{;};{;};{KoninkrijkBelgië;België};{پادشاهیبلیک;بلیک};{KrólestwoBelgii;Belgia};{ReinodaBélgica;Bélgica};{КоролевствоБельгия;Бельгия};{Belgickékľovstvo;Belgicko};{ReinodeBélgica;Bélgica};{KraljevinaBelgija;Belgija};{KonungariketBelgien;Belgien};{BelçikaKrallığı;Belçika};{مملکتِبلجئیم;بلجئیم};{;}};[50.83333333;4];false;[FRA;DEU;LUX;NLD];30528;;{{Belgian;Belgian};{Belge;Belge}}
{Benin;RepublicofBenin;{fra:{official:RépubliqueduBénin;common:Bénin}}};[.bj];BJ;204;BEN;BEN;true;officially-assigned;true;AfricanGroup;{XOF:{name:WestAfricanCFAfranc;symbol:Fr}};{+2;[29]};[Porto-Novo];[BJ;RepublicofBenin;RépubliqueduBénin];Africa;WesternAfrica;{fra:French};{{جمهوريةبنين;بنين};{RepublikBenin;Benin};{Beninskárepublika;Benin};{RepublikBenin;Benin};{BeniniVabariik;Benin};{Beninintasavalta;Benin};{RépubliqueduBénin;Bénin};{RepublikaBenin;Benin};{Beniniztársaság;Benin};{RepubblicadelBenin;Benin};{;};{;};{RepubliekBenin;Benin};{جمهوریبنین;بنین};{Benin;Benin};{RepúblicadoBenin;Benin};{РеспубликаБенин;Бенин};{Beninskárepublika;Benin};{RepúblicadeBenin;Benín};{RepublikaBenin;Benin};{RepublikenBenin;Benin};{BeninCumhuriyeti;Benin};{جمہوریہبینن;بینن};{;}};[9.5;2.25];false;[BFA;NER;NGA;TGO];112622;;{{Beninese;Beninese};{Béninoise;Béninois}}
{BurkinaFaso;BurkinaFaso;{fra:{official:RépubliqueduBurkina;common:BurkinaFaso}}};[.bf];BF;854;BFA;BUR;true;officially-assigned;true;AfricanGroup;{XOF:{name:WestAfricanCFAfranc;symbol:Fr}};{+2;[26]};[Ouagadougou];[BF];Africa;WesternAfrica;{fra:French};{{بوركينافاسو;بوركينافاسو};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{RépubliqueduBurkina;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;Burkina};{BurkinaFaso;BurkinaFaso};{;};{;};{BurkinaFaso;BurkinaFaso};{بورکینافاسو;بورکینافاسو};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{Буркина-Фасо;Буркина-Фасо};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{برکینافاسو;برکینافاسو};{;}};[13;-2];true;[BEN;CIV;GHA;MLI;NER;TGO];272967;;{{Burkinabe;Burkinabe};{Burkinabée;Burkinabé}}
{Bangladesh;People'sRepublicofBangladesh;{ben:{official:;common:}}};[.bd];BD;050;BGD;BAN;true;officially-assigned;true;AsiaandthePacificGroup;{BDT:{name:Bangladeshitaka;symbol:}};{+8;[80]};[Dhaka];[BD;People'sRepublicofBangladesh;GônôprôjatôntriBangladesh];Asia;SouthernAsia;{ben:Bengali};{{جمهوريةبنغلاديشالشعبية;بنغلاديش};{RepublikpoblBangladesh;Bangladesh};{Bangladéšskálidovárepublika;Bangladéš};{VolksrepublikBangladesch;Bangladesch};{BangladeshiRahvavabariik;Bangladesh};{Bangladeshinkansantasavalta;Bangladesh};{LaRépubliquepopulaireduBangladesh;Bangladesh};{NarodnaRepublikaBangladeš;Bangladeš};{Banglades;Banglades};{RepubblicapopolaredelBangladesh;Bangladesh};{;};{;};{VolksrepubliekBangladesh;Bangladesh};{جمهوریخلقبنگلادش;بنگلادش};{LudowaRepublikaBangladeszu;Bangladesz};{RepúblicaPopulardoBangladesh;Bangladesh};{НароднаяРеспубликаБангладеш;Бангладеш};{Bangladéšskaľudovárepublika;Bangladéš};{RepúblicaPopulardeBangladesh;Bangladesh};{NarodnaRepublikaBangladeš;Bangladeš};{FolkrepublikenBangladesh;Bangladesh};{BangladeşHalkCumhuriyeti;Bangladeş};{عوامیجمہوریہبنگلہدیش;بنگلہدیش};{;}};[24;90];false;[MMR;IND];147570;;{{Bangladeshi;Bangladeshi};{Bangladaise;Bangladais}}
{Bulgaria;RepublicofBulgaria;{bul:{official:РепубликаБългария;common:България}}};[.bg];BG;100;BGR;BUL;true;officially-assigned;true;EasternEuropeanGroup;{BGN:{name:Bulgarianlev;symbol:лв}};{+3;[59]};[Sofia];[BG;RepublicofBulgaria;РепубликаБългария];Europe;SoutheastEurope;{bul:Bulgarian};{{جمهوريةبلغاريا;بلغاريا};{RepublikBulgaria;Bulgaria};{Bulharskárepublika;Bulharsko};{RepublikBulgarien;Bulgarien};{BulgaariaVabariik;Bulgaaria};{Bulgariantasavalta;Bulgaria};{RépubliquedeBulgarie;Bulgarie};{RepublikaBugarska;Bugarska};{Bolgárztársaság;Bulgária};{RepubblicadiBulgaria;Bulgaria};{;};{;};{RepubliekBulgarije;Bulgarije};{جمهوریبلغارستان;بلغارستان};{RepublikaBułgarii;Bułgaria};{RepúblicadaBulgária;Bulgária};{РеспубликаБолгария;Болгария};{Bulharskárepublika;Bulharsko};{RepúblicadeBulgaria;Bulgaria};{RepublikaBugarska;Bugarska};{RepublikenBulgarien;Bulgarien};{BulgaristanCumhuriyeti;Bulgaristan};{جمہوریہبلغاریہ;بلغاریہ};{;}};[43;25];false;[GRC;MKD;ROU;SRB;TUR];110879;;{{Bulgarian;Bulgarian};{Bulgare;Bulgare}}
{Bahrain;KingdomofBahrain;{ara:{official:مملكةالبحرين;common:البحرين}}};[.bh];BH;048;BHR;BRN;true;officially-assigned;true;AsiaandthePacificGroup;{BHD:{name:Bahrainidinar;symbol:.د.ب}};{+9;[73]};[Manama];[BH;KingdomofBahrain;Mamlakatal-Barayn];Asia;WesternAsia;{ara:Arabic};{{مملكةالبحرين;البحرين};{RouantelezhBahrein;Bahrein};{KlovstvíBahrajn;Bahrajn};{KönigreichBahrain;Bahrain};{BahreiniKuningriik;Bahrein};{Bahraininkuningaskunta;Bahrain};{RoyaumedeBahreïn;Bahreïn};{KraljevinaBahrein;Bahrein};{BahreiniKirályság;Bahrein};{RegnodelBahrain;Bahrein};{;};{;};{KoninkrijkBahrein;Bahrein};{پادشاهیبحرین;بحرین};{KrólestwoBahrajnu;Bahrajn};{ReinodoBahrein;Bahrein};{КоролевствоБахрейн;Бахрейн};{Bahrajnskékľovstvo;Bahrajn};{ReinodeBahrein;Bahrein};{KraljevinaBahrein;Bahrein};{KonungariketBahrain;Bahrain};{BahreynKrallığı;Bahreyn};{مملکتِبحرین;بحرین};{;}};[26;50.55];false;[];765;;{{Bahraini;Bahraini};{Bahreïnienne;Bahreïnien}}
... (truncated)
minemizer (compact)
chars: 299,485 tokens: 156,354 chars_og/tok: 7.3 enc_chars/tok: 1.9
<s>name{common;official;native{...}};tld[];cca2;ccn3;cca3;cioc;independent;status;unMember;unRegionalGroup;currencies{...};idd{root;suffixes[]};capital[];altSpellings[];region;subregion;languages{...};translations{ara{official;common};bre{official;common};ces{official;common};deu{official;common};est{official;common};fin{official;common};fra{official;common};hrv{official;common};hun{official;common};ita{official;common};jpn{official;common};kor{official;common};nld{official;common};per{official;common};pol{official;common};por{official;common};rus{official;common};slk{official;common};spa{official;common};srp{official;common};swe{official;common};tur{official;common};urd{official;common};zho{official;common}};latlng[];landlocked;borders[];area;flag;demonyms{eng{f;m};fra{f;m}}
{Aruba;Aruba;{nld:{official:Aruba;common:Aruba};pap:{official:Aruba;common:Aruba}}};[.aw];AW;533;ABW;ARU;false;officially-assigned;false;;{AWG:{name:Arubanflorin;symbol:ƒ}};{+2;[97]};[Oranjestad];[AW];Americas;Caribbean;{nld:Dutch;pap:Papiamento};{{أروبا;أروبا};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{;};{;};{Aruba;Aruba};{آروبا;آروبا};{Aruba;Aruba};{Aruba;Aruba};{Аруба;Аруба};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{اروبا;اروبا};{;}};[12.5;-69.96666666];false;[];180;;{{Aruban;Aruban};{Arubaise;Arubais}}
{Afghanistan;IslamicRepublicofAfghanistan;{prs:{official:جمهوریاسلامیافغانستان;common:افغانستان};pus:{official:دافغانستاناسلاميجمهوریت;common:افغانستان};tuk:{official:OwganystanYslamRespublikasy;common:Owganystan}}};[.af];AF;004;AFG;AFG;true;officially-assigned;true;AsiaandthePacificGroup;{AFN:{name:Afghanafghani;symbol:}};{+9;[3]};[Kabul];[AF;Afġānistān];Asia;SouthernAsia;{prs:Dari;pus:Pashto;tuk:Turkmen};{{جمهوريةأففانستانالإسلامية;أفغانستان};{RepublikIslamekAfghanistan;Afghanistan};{Afghánskáislámskárepublika;Afghánistán};{IslamischeRepublikAfghanistan;Afghanistan};{AfganistaniIslamivabariik;Afganistan};{Afganistaninislamilainentasavalta;Afganistan};{Républiqueislamiqued'Afghanistan;Afghanistan};{IslamskaRepublikaAfganistan;Afganistan};{AfganisztániIszlámztársaság;Afganisztán};{Repubblicaislamicadell'Afghanistan;Afghanistan};{;};{;};{IslamitischeRepubliekAfghanistan;Afghanistan};{جمهوریاسلامیافغانستان;افغانستان};{IslamskaRepublikaAfganistanu;Afganistan};{RepúblicaIslâmicadoAfeganistão;Afeganistão};{ИсламскаяРеспубликаАфганистан;Афганистан};{Afgánskyislamskýštát;Afganistan};{RepúblicaIslámicadeAfganistán;Afganistán};{IslamskaRepublikaAvganistan;Avganistan};{IslamiskarepublikenAfghanistan;Afghanistan};{AfganistanİslamCumhuriyeti;Afganistan};{اسلامیجمہوریہافغانستان;افغانستان};{;}};[33;65];true;[IRN;PAK;TKM;UZB;TJK;CHN];652230;;{{Afghan;Afghan};{Afghane;Afghan}}
{Angola;RepublicofAngola;{por:{official:RepúblicadeAngola;common:Angola}}};[.ao];AO;024;AGO;ANG;true;officially-assigned;true;AfricanGroup;{AOA:{name:Angolankwanza;symbol:Kz}};{+2;[44]};[Luanda];[AO;RepúblicadeAngola;ʁɛpublikadean'ɡɔla];Africa;MiddleAfrica;{por:Portuguese};{{أنغولا;جمهوريةأنغولا};{RepublikAngola;Angola};{Angolskárepublika;Angola};{RepublikAngola;Angola};{AngolaVabariik;Angola};{Angolantasavalta;Angola};{Républiqued'Angola;Angola};{RepublikaAngola;Angola};{Angola;Angola};{Repubblicadell'Angola;Angola};{;};{;};{RepubliekAngola;Angola};{جمهوریآنگولا;آنگولا};{RepublikaAngoli;Angola};{RepúblicadeAngola;Angola};{РеспубликаАнгола;Ангола};{Angolskárepublika;Angola};{RepúblicadeAngola;Angola};{RepublikaAngola;Angola};{RepublikenAngola;Angola};{AngolaCumhuriyeti;Angola};{جمہوریہانگولہ;انگولہ};{;}};[-12.5;18.5];false;[COG;COD;ZMB;NAM];1246700;;{{Angolan;Angolan};{Angolaise;Angolais}}
{Anguilla;Anguilla;{eng:{official:Anguilla;common:Anguilla}}};[.ai];AI;660;AIA;;false;officially-assigned;false;;{XCD:{name:EasternCaribbeandollar;symbol:$}};{+1;[264]};[TheValley];[AI];Americas;Caribbean;{eng:English};{{أنغويلا;أنغويلا};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{;};{;};{Anguilla;Anguilla};{آنگویلا;آنگویلا};{Anguilla;Anguilla};{Anguilla;Anguilla};{Ангилья;Ангилья};{Anguilla;Anguilla};{Anguila;Anguilla};{Angvila;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{اینگویلا;اینگویلا};{;}};[18.25;-63.16666666];false;[];91;;{{Anguillian;Anguillian};{Anguillane;Anguillan}}
{ÅlandIslands;ÅlandIslands;{swe:{official:LandskapetÅland;common:Åland}}};[.ax];AX;248;ALA;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+3;[5818]};[Mariehamn];[AX;Aaland;Aland;Ahvenanmaa];Europe;NorthernEurope;{swe:Swedish};{{جزرأولاند;جزرأولاند};{IniziÅland;Åland};{Ålandskéostrovy;Ålandy};{Åland-Inseln;Åland};{Ahvenamaamaakond;Ahvenamaa};{Ahvenanmaanmaakunta;Ahvenanmaa};{Ahvenanmaa;Ahvenanmaa};{AlandIslands;Ålandskiotoci};{Åland-szigetek;Åland-szigetek};{IsoleÅland;IsoleAland};{;};{;};{Ålandeilanden;Ålandeilanden};{جزایرالند;جزایرالند};{WyspyAlandzkie;WyspyAlandzkie};{IlhasÅland;Alândia};{Аландскиеострова;Аландскиеострова};{Alandskéostrovy;Alandy};{IslasÅland;Alandia};{OlandskaOstrva;OlandskaOstrva};{Åland;Åland};{ÅlandAdaları;Åland};{جزائراولند;جزائراولند};{;}};[60.116667;19.9];false;[];1580;;{{Ålandish;Ålandish};{Ålandaise;Ålandais}}
{Albania;RepublicofAlbania;{sqi:{official:RepublikaeShqipërisë;common:Shqipëria}}};[.al];AL;008;ALB;ALB;true;officially-assigned;true;EasternEuropeanGroup;{ALL:{name:Albanianlek;symbol:L}};{+3;[55]};[Tirana];[AL;Shqipëri;Shqipëria;Shqipnia];Europe;SoutheastEurope;{sqi:Albanian};{{جمهوريةألبانيا;ألبانيا};{RepublikAlbania;Albania};{Albánskárepublika;Albánie};{RepublikAlbanien;Albanien};{AlbaaniaVabariik;Albaania};{Albaniantasavalta;Albania};{Républiqued'Albanie;Albanie};{RepublikaAlbanija;Albanija};{Albánztársaság;Albánia};{Repubblicad'Albania;Albania};{;};{;};{RepubliekAlban;Alban};{جمهوریآلبانی;آلبانی};{RepublikaAlbanii;Albania};{RepúblicadaAlbânia;Albânia};{РеспубликаАлбания;Албания};{Albánskarepublika;Albánsko};{RepúblicadeAlbania;Albania};{RepublikaAlbanija;Albanija};{RepublikenAlbanien;Albanien};{ArnavutlukCumhuriyeti;Arnavutluk};{جمہوریہالبانیا;البانیا};{;}};[41;20];false;[MNE;GRC;MKD;UNK];28748;;{{Albanian;Albanian};{Albanaise;Albanais}}
{Andorra;PrincipalityofAndorra;{cat:{official:Principatd'Andorra;common:Andorra}}};[.ad];AD;020;AND;AND;true;officially-assigned;true;WesternEuropeanandOthersGroup;{EUR:{name:Euro;symbol:}};{+3;[76]};[AndorralaVella];[AD;PrincipalityofAndorra;Principatd'Andorra];Europe;SouthernEurope;{cat:Catalan};{{إمارةأندورا;أندورا};{PriñselezhAndorra;Andorra};{Andorrskéknížect;Andorra};{FürstentumAndorra;Andorra};{AndorraVürstiriik;Andorra};{Andorranruhtinaskunta;Andorra};{Principautéd'Andorre;Andorre};{KneževinaAndora;Andora};{Andorra;Andorra};{PrincipatodiAndorra;Andorra};{;};{;};{PrinsdomAndorra;Andorra};{شاهزادهنشینآندورا;آندورا};{KsięstwoAndory;Andora};{PrincipadodeAndorra;Andorra};{КняжествоАндорра;Андорра};{Andorrskékniežatstvo;Andorra};{PrincipadodeAndorra;Andorra};{KneževinaAndora;Andora};{FurstendömetAndorra;Andorra};{AndorraPrensliği;Andorra};{اماراتِانورا;انورا};{;}};[42.5;1.5];true;[FRA;ESP];468;;{{Andorran;Andorran};{Andorrane;Andorran}}
{UnitedArabEmirates;UnitedArabEmirates;{ara:{official:الإماراتالعربيةالمتحدة;common:الإمارات}}};[.ae;امارات.];AE;784;ARE;UAE;true;officially-assigned;true;AsiaandthePacificGroup;{AED:{name:UnitedArabEmiratesdirham;symbol:د.إ}};{+9;[71]};[AbuDhabi];[AE;UAE;Emirates];Asia;WesternAsia;{ara:Arabic};{{الإماراتالعربيةالمتحدة;الإمارات};{EmirelezhioùArabUnanet;EmirelezhioùArabUnanet};{Spojenéarabskéemiráty;Spojenéarabskéemiráty};{VereinigteArabischeEmirate;VereinigteArabischeEmirate};{AraabiaÜhendemiraadid;AraabiaÜhendemiraadid};{Yhdistyneetarabiemiirikunnat;Arabiemiraatit};{Émiratsarabesunis;Émiratsarabesunis};{UjedinjeniArapskiEmirati;UjedinjeniArapskiEmirati};{EgyesültArabEmírségek;EgyesültArabEmírségek};{EmiratiArabiUniti;EmiratiArabiUniti};{;UAE};{;};{VerenigdeArabischeEmiraten;VerenigdeArabischeEmiraten};{اماراتمتحدهعربی;امارات};{ZjednoczoneEmiratyArabskie;ZjednoczoneEmiratyArabskie};{EmiradosÁrabesUnidos;EmiradosÁrabesUnidos};{ОбъединенныеАрабскиеЭмираты;ОбъединённыеАрабскиеЭмираты};{Spojenéarabskéemiráty;Spojenéarabskéemiráty};{EmiratosÁrabesUnidos;EmiratosÁrabesUnidos};{UjedinjeniArapskiEmirati;UjedinjeniArapskiEmirati};{FörenadeArabemiraten;FörenadeArabemiraten};{BirleşikArapEmirlikleri;BirleşikArapEmirlikleri};{متحدہعربامارات;متحدہعربامارات};{;}};[24;54];false;[OMN;SAU];83600;;{{Emirati;Emirati};{Emirienne;Emirien}}
{Argentina;ArgentineRepublic;{grn:{official:ArgentineRepublic;common:Argentina};spa:{official:RepúblicaArgentina;common:Argentina}}};[.ar];AR;032;ARG;ARG;true;officially-assigned;true;LatinAmericanandCaribbeanGroup;{ARS:{name:Argentinepeso;symbol:$}};{+5;[4]};[BuenosAires];[AR;ArgentineRepublic;RepúblicaArgentina];Americas;SouthAmerica;{grn:Guaraní;spa:Spanish};{{جمهوريةالأرجنتين;الأرجنتين};{RepublikArc'hantina;Arc'hantina};{Argentinskárepublika;Argentina};{ArgentinischeRepublik;Argentinien};{ArgentinaVabariik;Argentina};{Argentiinantasavalta;Argentiina};{Républiqueargentine;Argentine};{ArgentinskiRepublika;Argentina};{Argentinztársaság;Argentína};{RepubblicaArgentina;Argentina};{;};{;};{ArgentijnseRepubliek;Argentinië};{جمهوریآرانتین;آرانتین};{RepublikaArgentyńska;Argentyna};{RepúblicaArgentina;Argentina};{АргентинскаяРеспублика;Аргентина};{Argentínskarepublika;Argentína};{RepúblicaArgentina;Argentina};{RepublikaArgentina;Argentina};{RepublikenArgentina;Argentina};{ArjantinCumhuriyeti;Arjantin};{جمہوریہارجنائن;ارجنائن};{;}};[-34;-64];false;[BOL;BRA;CHL;PRY;URY];2780400;;{{Argentine;Argentine};{Argentine;Argentin}}
{Armenia;RepublicofArmenia;{hye:{official:ՀայաստանիՀանրապետություն;common:Հայաստան}}};[.am];AM;051;ARM;ARM;true;officially-assigned;true;EasternEuropeanGroup;{AMD:{name:Armeniandram;symbol:}};{+3;[74]};[Yerevan];[AM;Hayastan;RepublicofArmenia;ՀայաստանիՀանրապետություն];Asia;WesternAsia;{hye:Armenian};{{جمهوريةأرمينيا;أرمينيا};{RepublikArmenia;Armenia};{Arménskárepublika;Arménie};{RepublikArmenien;Armenien};{ArmeeniaVabariik;Armeenia};{Armeniantasavalta;Armenia};{Républiqued'Arménie;Arménie};{RepublikaArmenija;Armenija};{Örményország;Örményország};{RepubblicadiArmenia;Armenia};{;};{;};{RepubliekArmen;Armen};{جمهوریارمنستان;ارمنستان};{RepublikaArmenii;Armenia};{RepúblicadaArménia;Arménia};{РеспубликаАрмения;Армения};{Arménskarepublika;Arménsko};{RepúblicadeArmenia;Armenia};{RepublikaJermenija;Jermenija};{RepublikenArmenien;Armenien};{ErmenistanCumhuriyeti;Ermenistan};{جمہوریہآرمینیا;آرمینیا};{;}};[40;45];true;[AZE;GEO;IRN;TUR];29743;;{{Armenian;Armenian};{Arménienne;Arménien}}
{AmericanSamoa;AmericanSamoa;{eng:{official:AmericanSamoa;common:AmericanSamoa};smo:{official:SāmoaAmelika;common:SāmoaAmelika}}};[.as];AS;016;ASM;ASA;false;officially-assigned;false;;{USD:{name:UnitedStatesdollar;symbol:$}};{+1;[684]};[PagoPago];[AS;AmerikaSāmoa;AmelikaSāmoa;SāmoaAmelika];Oceania;Polynesia;{eng:English;smo:Samoan};{{سامواالأمريكية;سامواالأمريكية};{SamoaAmerikan;SamoaAmerikan};{AmerickáSamoa;AmerickáSamoa};{Amerikanisch-Samoa;Amerikanisch-Samoa};{AmeerikaSamoa;AmeerikaSamoa};{AmerikanSamoa;AmerikanSamoa};{Samoaaméricaines;Samoaaméricaines};{amerkaSamoa;AmerkaSamoa};{Szamoa;Szamoa};{Samoaamericane;SamoaAmericane};{;};{;};{AmerikaansSamoa;AmerikaansSamoa};{ساموآیآمریکا;ساموآیآمریکا};{SamoaAmerykańskie;SamoaAmerykańskie};{Samoaamericana;SamoaAmericana};{американскоеСамоа;АмериканскоеСамоа};{AmerickáSamoa;AmerickáSamoa};{SamoaAmericana;SamoaAmericana};{AmerkaSamoa;AmerkaSamoa};{AmerikanskaSamoa;AmerikanskaSamoa};{AmerikanSamoası;AmerikanSamoası};{امریکیسمووا;امریکیسمووا};{;}};[-14.33333333;-170];false;[];199;;{{AmericanSamoan;AmericanSamoan};{Samoane;Samoan}}
{Antarctica;Antarctica;{}};[.aq];AQ;010;ATA;;false;officially-assigned;false;;{};{;[]};[];[AQ];Antarctic;;{};{{أنتارتيكا;أنتارتيكا};{Antarktika;Antarktika};{Antarktida;Antarktida};{Antarktika;Antarktis};{Antarktika;Antarktika};{Etelämanner;Etelämanner};{Antarctique;Antarctique};{Antarktika;Antarktika};{Antarktisz;Antarktisz};{Antartide;Antartide};{;};{;};{Antarctica;Antarctica};{جنوبگان;جنوبگان};{Antarktyka;Antarktyka};{Antártica;Antártida};{Антарктида;Антарктида};{Antarktída;Antarktída};{Antártida;Antártida};{Antarktik;Antarktik};{Antarktis;Antarktis};{Antarktika;Antarktika};{انارککا;انارککا};{;}};[-90;0];false;[];14000000;;{{Antarctican;Antarctican};{Antarcticaine;Antarcticain}}
{FrenchSouthernandAntarcticLands;TerritoryoftheFrenchSouthernandAntarcticLands;{fra:{official:TerritoiredesTerresaustralesetantarctiquesfrançaises;common:Terresaustralesetantarctiquesfrançaises}}};[.tf];TF;260;ATF;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+2;[62]};[Port-aux-Français];[TF;FrenchSouthernTerritories];Antarctic;;{fra:French};{{مقاطعاتوأقاليمماوراءالبحارالفرنسية;أراضفرنسيةجنوبيةوأنتارتيكية};{TiriadDouaroùAostralhagAntarktikelFrañs;DouaroùAostralhagAntarktikelFrañs};{TeritoriumFrancouzskájižaantarktickáúzemí;Francouzskájižaantarktickáúzemí};{GebietderFranzösischSüd-undAntarktisgebiete;FranzösischeSüd-undAntarktisgebiete};{PrantsuseLõunaalad;PrantsuseLõunaalad};{Ranskaneteläisetjaantarktisetalueet;Ranskaneteläisetjaantarktisetalueet};{TerritoiredesTerresaustralesetantarctiquesfrançaises;Terresaustralesetantarctiquesfrançaises};{TeritorijuFrancuskijužniiantarktičkiteritoriji;Francuskijužniiantarktičkiteritoriji};{Francialiésantarktisziterületek;Francialiésantarktisziterületek};{TerritoriodellaaustralieantartichefrancesiTerre;TerritoriFrancesidelSud};{;};{;};{GrondgebiedvandeFranseZuidelijkeenAntarctischegebieden;FranseGebiedenindezuidelijkeIndischeOceaan};{سرزمینهایجنوبیوجنوبگانیفرانسه;سرزمینهایجنوبیوجنوبگانیفرانسه};{FrancuskieTerytoriaPołudnioweiAntarktyczne;FrancuskieTerytoriaPołudnioweiAntarktyczne};{TerritóriodoSuleAntárticaFrancesa;TerrasAustraiseAntárticasFrancesas};{ТерриторияФранцузскиеЮжныеиАнтарктическиеземли;ФранцузскиеЮжныеиАнтарктическиетерритории};{Francúzskejužaantarktickéúzemia;FrancúzskejuŽaantarktickéúzemia};{TerritoriodelFrancésTierrasaustralesyantárticas;TierrasAustralesyAntárticasFrancesas};{Francuskejužneiantarktičkezemlje;Francuskejužneiantarktičkezemlje};{Franskasyd-ochAntarktisterritorierna;Franskasödraterritorierna};{FransızneyveAntarktikaToprakları;FransızneyveAntarktikaToprakları};{سرزمینِجنوبیفرانسیسیہوانارکیکہ;سرزمینجنوبیفرانسیسیہوانارکیکا};{;}};[-49.25;69.167];false;[];7747;;{{French;French};{Française;Franç
ais}}
{AntiguaandBarbuda;AntiguaandBarbuda;{eng:{official:AntiguaandBarbuda;common:AntiguaandBarbuda}}};[.ag];AG;028;ATG;ANT;true;officially-assigned;true;LatinAmericanandCaribbeanGroup;{XCD:{name:EasternCaribbeandollar;symbol:$}};{+1;[268]};[SaintJohn's];[AG];Americas;Caribbean;{eng:English};{{أنتيغواوباربودا;أنتيغواوباربودا};{AntiguahaBarbuda;AntiguahaBarbuda};{AntiguaaBarbuda;AntiguaaBarbuda};{AntiguaundBarbuda;AntiguaundBarbuda};{AntiguajaBarbuda;AntiguajaBarbuda};{AntiguajaBarbuda;AntiguajaBarbuda};{Antigua-et-Barbuda;Antigua-et-Barbuda};{AntigvaiBarbuda;AntigvaiBarbuda};{AntiguaésBarbuda;AntiguaésBarbuda};{AntiguaeBarbuda;AntiguaeBarbuda};{;};{;};{AntiguaenBarbuda;AntiguaenBarbuda};{آنتیگواوباربودا;آنتیگواوباربودا};{AntiguaiBarbuda;AntiguaiBarbuda};{AntiguaeBarbuda;AntíguaeBarbuda};{АнтигуаиБарбуда;АнтигуаиБарбуда};{AntiguaaBarbuda;AntiguaaBarbuda};{AntiguayBarbuda;AntiguayBarbuda};{AntigvaiBarbuda;AntigvaiBarbuda};{AntiguaochBarbuda;AntiguaochBarbuda};{AntiguaveBarbuda;AntiguaveBarbuda};{اینیگواوباربوا;اینیگواوباربوا};{;}};[17.05;-61.8];false;[];442;;{{Antiguan,Barbudan;Antiguan,Barbudan};{Antiguaiseetbarbudienne;Antiguaiseetbarbudien}}
{Australia;CommonwealthofAustralia;{eng:{official:CommonwealthofAustralia;common:Australia}}};[.au];AU;036;AUS;AUS;true;officially-assigned;true;WesternEuropeanandOthersGroup;{AUD:{name:Australiandollar;symbol:$}};{+6;[1]};[Canberra];[AU];Oceania;AustraliaandNewZealand;{eng:English};{{كومونولثأستراليا;أستراليا};{KengladAostralia;Aostralia};{Australskéspolečenství;Austrálie};{CommonwealthAustralien;Australien};{AustraaliaÜhendus;Austraalia};{Australianliittovaltio;Australia};{Australie;Australie};{CommonwealthofAustralia;Australija};{AusztrálÁllamszövetség;Ausztrália};{Commonwealthdell'Australia;Australia};{;};{;};{GemenebestvanAustral;Austral};{قلمروهمسوداسترالیا;استرالیا};{ZwiązekAustralijski;Australia};{ComunidadedaAustrália;Austrália};{СодружествоАвстралии;Австралия};{Austrálskyzz;Austrália};{MancomunidaddeAustralia;Australia};{KomonveltAustralija;Australija};{Australiskastatsförbundet;Australien};{AvustralyaFederalDevleti;Avustralya};{دولتِمشترکہآسریلیا;آسریلیا};{;}};[-27;133];false;[];7692024;;{{Australian;Australian};{Australienne;Australien}}
{Austria;RepublicofAustria;{bar:{official:RepublikÖsterreich;common:Österreich}}};[.at];AT;040;AUT;AUT;true;officially-assigned;true;WesternEuropeanandOthersGroup;{EUR:{name:Euro;symbol:}};{+4;[3]};[Vienna];[AT;Osterreich;Oesterreich];Europe;CentralEurope;{bar:Austro-BavarianGerman};{{جمهوريةالنمسا;النمسا};{RepublikAostria;Aostria};{Rakousrepublika;Rakousko};{RepublikÖsterreich;Österreich};{AustriaVabariik;Austria};{Itävallantasavalta;Itävalta};{Républiqued'Autriche;Autriche};{RepublikaAustrija;Austrija};{Ausztria;Ausztria};{Repubblicad'Austria;Austria};{;};{;};{RepubliekOostenrijk;Oostenrijk};{جمهوریاتریش;اتریش};{RepublikaAustrii;Austria};{RepúblicadaÁustria;Áustria};{АвстрийскаяРеспублика;Австрия};{Rakúskarepublika;Rakúsko};{RepúblicadeAustria;Austria};{RepublikaAustrija;Austrija};{RepublikenÖsterrike;Österrike};{AvusturyaCumhuriyeti;Avusturya};{جمہوریہآسریا;آسریا};{;}};[47.33333333;13.33333333];true;[CZE;DEU;HUN;ITA;LIE;SVK;SVN;CHE];83871;;{{Austrian;Austrian};{Autrichienne;Autrichien}}
{Azerbaijan;RepublicofAzerbaijan;{aze:{official:AzərbaycanRespublikası;common:Azərbaycan};rus:{official:АзербайджанскаяРеспублика;common:Азербайджан}}};[.az];AZ;031;AZE;AZE;true;officially-assigned;true;EasternEuropeanGroup;{AZN:{name:Azerbaijanimanat;symbol:}};{+9;[94]};[Baku];[AZ;RepublicofAzerbaijan;AzərbaycanRespublikası];Asia;WesternAsia;{aze:Azerbaijani;rus:Russian};{{جمهوريةأذربيجان;أذربيجان};{RepublikAzerbaidjan;Azerbaidjan};{Ázerbájdžánskárepublika;Ázerbájdžán};{RepublikAserbaidschan;Aserbaidschan};{AserbaidžaaniVabariik;Aserbaidžaan};{Azerbaidzanintasavalta;Azerbaidzan};{Républiqued'Azerbaïdjan;Azerbaïdjan};{RepublikaAzerbajdžan;Azerbajdžan};{Azerbajdzsán;Azerbajdzsán};{Repubblicadell'Azerbaigian;Azerbaijan};{;};{;};{RepubliekAzerbeidzjan;Azerbeidzjan};{جمهوریآذربایجان;جمهوریآذربایجان};{RepublikaAzerbejdżanu;Azerbejdżan};{RepúblicadoAzerbaijão;Azerbeijão};{АзербайджанскаяРеспублика;Азербайджан};{Azerbajanskárepublika;Azerbajan};{RepúblicadeAzerbaiyán;Azerbaiyán};{RepublikaAzerbejdžan;Azerbejdžan};{RepublikenAzerbajdzjan;Azerbajdzjan};{AzerbaycanCumhuriyeti;Azerbaycan};{جمہوریہآذربائیجان;آذربائیجان};{;}};[40.5;47.5];true;[ARM;GEO;IRN;RUS;TUR];86600;;{{Azerbaijani;Azerbaijani};{Azerbaïdjanaise;Azerbaïdjanais}}
{Burundi;RepublicofBurundi;{fra:{official:RépubliqueduBurundi;common:Burundi};run:{official:Republikay'Uburundi;common:Uburundi}}};[.bi];BI;108;BDI;BDI;true;officially-assigned;true;AfricanGroup;{BIF:{name:Burundianfranc;symbol:Fr}};{+2;[57]};[Gitega];[BI;RepublicofBurundi;Republikay'Uburundi;RépubliqueduBurundi];Africa;EasternAfrica;{fra:French;run:Kirundi};{{جمهوريةبوروندي;بوروندي};{RepublikBurundi;Burundi};{Burundskárepublika;Burundi};{RepublikBurundi;Burundi};{BurundiVabariik;Burundi};{Burundintasavalta;Burundi};{RépubliqueduBurundi;Burundi};{Burundi;Burundi};{Burundi;Burundi};{RepubblicadelBurundi;Burundi};{;};{;};{RepubliekBurundi;Burundi};{جمهوریبوروندی;بوروندی};{RepublikaBurundi;Burundi};{RepúblicadoBurundi;Burundi};{РеспубликаБурунди;Бурунди};{Burundskárepublika;Burundi};{RepúblicadeBurundi;Burundi};{RepublikaBurundi;Burundi};{RepublikenBurundi;Burundi};{BurundiCumhuriyeti;Burundi};{جمہوریہبرونی;برونی};{;}};[-3.5;30];true;[COD;RWA;TZA];27834;;{{Burundian;Burundian};{Burundaise;Burundais}}
{Belgium;KingdomofBelgium;{deu:{official:KönigreichBelgien;common:Belgien};fra:{official:RoyaumedeBelgique;common:Belgique};nld:{official:KoninkrijkBelgië;common:België}}};[.be];BE;056;BEL;BEL;true;officially-assigned;true;WesternEuropeanandOthersGroup;{EUR:{name:Euro;symbol:}};{+3;[2]};[Brussels];[BE;België;Belgie;Belgien;Belgique;KingdomofBelgium;KoninkrijkBelgië;RoyaumedeBelgique;KönigreichBelgien];Europe;WesternEurope;{deu:German;fra:French;nld:Dutch};{{مملكةبلجيكا;بلجيكا};{RouantelezhBelgia;Belgia};{Belgickéklovství;Belgie};{KönigreichBelgien;Belgien};{BelgiaKuningriik;Belgia};{Belgiankuningaskunta;Belgia};{RoyaumedeBelgique;Belgique};{KraljevinaBelgija;Belgija};{BelgaKirályság;Belgium};{RegnodelBelgio;Belgio};{;};{;};{KoninkrijkBelgië;België};{پادشاهیبلیک;بلیک};{KrólestwoBelgii;Belgia};{ReinodaBélgica;Bélgica};{КоролевствоБельгия;Бельгия};{Belgickékľovstvo;Belgicko};{ReinodeBélgica;Bélgica};{KraljevinaBelgija;Belgija};{KonungariketBelgien;Belgien};{BelçikaKrallığı;Belçika};{مملکتِبلجئیم;بلجئیم};{;}};[50.83333333;4];false;[FRA;DEU;LUX;NLD];30528;;{{Belgian;Belgian};{Belge;Belge}}
{Benin;RepublicofBenin;{fra:{official:RépubliqueduBénin;common:Bénin}}};[.bj];BJ;204;BEN;BEN;true;officially-assigned;true;AfricanGroup;{XOF:{name:WestAfricanCFAfranc;symbol:Fr}};{+2;[29]};[Porto-Novo];[BJ;RepublicofBenin;RépubliqueduBénin];Africa;WesternAfrica;{fra:French};{{جمهوريةبنين;بنين};{RepublikBenin;Benin};{Beninskárepublika;Benin};{RepublikBenin;Benin};{BeniniVabariik;Benin};{Beninintasavalta;Benin};{RépubliqueduBénin;Bénin};{RepublikaBenin;Benin};{Beniniztársaság;Benin};{RepubblicadelBenin;Benin};{;};{;};{RepubliekBenin;Benin};{جمهوریبنین;بنین};{Benin;Benin};{RepúblicadoBenin;Benin};{РеспубликаБенин;Бенин};{Beninskárepublika;Benin};{RepúblicadeBenin;Benín};{RepublikaBenin;Benin};{RepublikenBenin;Benin};{BeninCumhuriyeti;Benin};{جمہوریہبینن;بینن};{;}};[9.5;2.25];false;[BFA;NER;NGA;TGO];112622;;{{Beninese;Beninese};{Béninoise;Béninois}}
{BurkinaFaso;BurkinaFaso;{fra:{official:RépubliqueduBurkina;common:BurkinaFaso}}};[.bf];BF;854;BFA;BUR;true;officially-assigned;true;AfricanGroup;{XOF:{name:WestAfricanCFAfranc;symbol:Fr}};{+2;[26]};[Ouagadougou];[BF];Africa;WesternAfrica;{fra:French};{{بوركينافاسو;بوركينافاسو};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{RépubliqueduBurkina;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;Burkina};{BurkinaFaso;BurkinaFaso};{;};{;};{BurkinaFaso;BurkinaFaso};{بورکینافاسو;بورکینافاسو};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{Буркина-Фасо;Буркина-Фасо};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{BurkinaFaso;BurkinaFaso};{برکینافاسو;برکینافاسو};{;}};[13;-2];true;[BEN;CIV;GHA;MLI;NER;TGO];272967;;{{Burkinabe;Burkinabe};{Burkinabée;Burkinabé}}
{Bangladesh;People'sRepublicofBangladesh;{ben:{official:;common:}}};[.bd];BD;050;BGD;BAN;true;officially-assigned;true;AsiaandthePacificGroup;{BDT:{name:Bangladeshitaka;symbol:}};{+8;[80]};[Dhaka];[BD;People'sRepublicofBangladesh;GônôprôjatôntriBangladesh];Asia;SouthernAsia;{ben:Bengali};{{جمهوريةبنغلاديشالشعبية;بنغلاديش};{RepublikpoblBangladesh;Bangladesh};{Bangladéšskálidovárepublika;Bangladéš};{VolksrepublikBangladesch;Bangladesch};{BangladeshiRahvavabariik;Bangladesh};{Bangladeshinkansantasavalta;Bangladesh};{LaRépubliquepopulaireduBangladesh;Bangladesh};{NarodnaRepublikaBangladeš;Bangladeš};{Banglades;Banglades};{RepubblicapopolaredelBangladesh;Bangladesh};{;};{;};{VolksrepubliekBangladesh;Bangladesh};{جمهوریخلقبنگلادش;بنگلادش};{LudowaRepublikaBangladeszu;Bangladesz};{RepúblicaPopulardoBangladesh;Bangladesh};{НароднаяРеспубликаБангладеш;Бангладеш};{Bangladéšskaľudovárepublika;Bangladéš};{RepúblicaPopulardeBangladesh;Bangladesh};{NarodnaRepublikaBangladeš;Bangladeš};{FolkrepublikenBangladesh;Bangladesh};{BangladeşHalkCumhuriyeti;Bangladeş};{عوامیجمہوریہبنگلہدیش;بنگلہدیش};{;}};[24;90];false;[MMR;IND];147570;;{{Bangladeshi;Bangladeshi};{Bangladaise;Bangladais}}
{Bulgaria;RepublicofBulgaria;{bul:{official:РепубликаБългария;common:България}}};[.bg];BG;100;BGR;BUL;true;officially-assigned;true;EasternEuropeanGroup;{BGN:{name:Bulgarianlev;symbol:лв}};{+3;[59]};[Sofia];[BG;RepublicofBulgaria;РепубликаБългария];Europe;SoutheastEurope;{bul:Bulgarian};{{جمهوريةبلغاريا;بلغاريا};{RepublikBulgaria;Bulgaria};{Bulharskárepublika;Bulharsko};{RepublikBulgarien;Bulgarien};{BulgaariaVabariik;Bulgaaria};{Bulgariantasavalta;Bulgaria};{RépubliquedeBulgarie;Bulgarie};{RepublikaBugarska;Bugarska};{Bolgárztársaság;Bulgária};{RepubblicadiBulgaria;Bulgaria};{;};{;};{RepubliekBulgarije;Bulgarije};{جمهوریبلغارستان;بلغارستان};{RepublikaBułgarii;Bułgaria};{RepúblicadaBulgária;Bulgária};{РеспубликаБолгария;Болгария};{Bulharskárepublika;Bulharsko};{RepúblicadeBulgaria;Bulgaria};{RepublikaBugarska;Bugarska};{RepublikenBulgarien;Bulgarien};{BulgaristanCumhuriyeti;Bulgaristan};{جمہوریہبلغاریہ;بلغاریہ};{;}};[43;25];false;[GRC;MKD;ROU;SRB;TUR];110879;;{{Bulgarian;Bulgarian};{Bulgare;Bulgare}}
{Bahrain;KingdomofBahrain;{ara:{official:مملكةالبحرين;common:البحرين}}};[.bh];BH;048;BHR;BRN;true;officially-assigned;true;AsiaandthePacificGroup;{BHD:{name:Bahrainidinar;symbol:.د.ب}};{+9;[73]};[Manama];[BH;KingdomofBahrain;Mamlakatal-Barayn];Asia;WesternAsia;{ara:Arabic};{{مملكةالبحرين;البحرين};{RouantelezhBahrein;Bahrein};{KlovstvíBahrajn;Bahrajn};{KönigreichBahrain;Bahrain};{BahreiniKuningriik;Bahrein};{Bahraininkuningaskunta;Bahrain};{RoyaumedeBahreïn;Bahreïn};{KraljevinaBahrein;Bahrein};{BahreiniKirályság;Bahrein};{RegnodelBahrain;Bahrein};{;};{;};{KoninkrijkBahrein;Bahrein};{پادشاهیبحرین;بحرین};{KrólestwoBahrajnu;Bahrajn};{ReinodoBahrein;Bahrein};{КоролевствоБахрейн;Бахрейн};{Bahrajnskékľovstvo;Bahrajn};{ReinodeBahrein;Bahrein};{KraljevinaBahrein;Bahrein};{KonungariketBahrain;Bahrain};{BahreynKrallığı;Bahreyn};{مملکتِبحرین;بحرین};{;}};[26;50.55];false;[];765;;{{Bahraini;Bahraini};{Bahreïnienne;Bahreïnien}}
... (truncated)
large_non_uniform_nested_mixed.json — Original: 2402 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
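| Format | Chars | Tokens | chars_og/tok | enc_chars/tok |
|---|---|---|---|---|
| JSON (pretty) | 2,402 | 1,003 | 2.4 | 2.4 |
| JSON (min) | 1,500 | 522 | 4.6 | 2.9 |
| CSV | N/A | | | |
| TSV | N/A | | | |
| YAML | 1,573 | 617 | 3.9 | 2.5 |
| TOON | 1,766 | 625 | 3.8 | 2.8 |
| TSON | 1,275 | 560 | 4.3 | 2.3 |
| minemizer | 1,203 | 452 | 5.3 | 2.7 |
| minemizer (compact) | 1,072 | 462 | 5.2 | 2.3 |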
JSON (pretty)
chars: 2,402 tokens: 1,003 chars_og/tok: 2.4 enc_chars/tok: 2.4
<s>[
{
··"id":1,
··"name":"Alice",
··"work":{
····"title":"SeniorEngineer",
····"years":5,
····"remote":true,
····"team":"Platform"
··},
··"contact":{
····"email":"alice@co.com"
··}
},
{
··"id":2,
··"profile":{
····"age":28,
····"city":"NYC",
····"verified":true
··},
··"status":"active",
··"permissions":{
····"admin":false,
····"editor":true
... (truncated)
JSON (min)
chars: 1,500 tokens: 522 chars_og/tok: 4.6 enc_chars/tok: 2.9
<s>[{"id":1,"name":"Alice","work":{"title":"SeniorEngineer","years":5,"remote":true,"team":"Platform"},"contact":{"email":"alice@co.com"}},{"id":2,"profile":{"age":28,"city":"NYC","verified":true},"status":"active","permissions":{"admin":false,"editor":true}},{"id":3,"name":"Charlie","contact":{"email":"c@example.com","preferred":"email","phone":"555-0103"},"metadata":{"created":"2019-06-10"}},{"id":4,"user":{"username":"diana","role":"admin","level":5},"metadata":{"created":"2020-09-01","updated":"2024-01-20"},"settings":{"theme":"dark"}},{"id":5,"employee":{"name":"EveAdams","department":"Sales"},"performance":{"score":85,"reviews":3},"contact":{"email":"eve@co.com","slack":"@eve"}},{"id":6,"name":"Frank","work":{"title":"ProductManager","years":8,"remote":false,"team":"Growth"},"contact":{"email":"frank@co.com","phone":"555-0106"}},{"id":7,"profile":{"age":35,"city":"LA","verified":false},"status":"inactive","permissions":{"admin":true,"editor":false},"metadata":{"created":"2018-03-15"}},{"id":8,"name":"Grace","contact":{"email":"grace@example.org","preferred":"slack","slack":"@grace"},"settings":{"theme":"light","notifications":true}},{"id":9,"user":{"username":"henry","role":"viewer","level":2},"employee":{"name":"HenryWilson","department":"Marketing"},"performance":{"score":72,"reviews":5}},{"id":10,"name":"Iris","work":{"title":"Designer","years":3,"remote":true,"team":"Creative"},"profile":{"age":26,"city":"Austin","verified":true},"contact":{"email":"iris@co.com"}}]
CSV: N/A
TSV: N/A
YAML
chars: 1,573 tokens: 617 chars_og/tok: 3.9 enc_chars/tok: 2.5
<s>-contact:
··email:alice@co.com
id:1
name:Alice
work:
··remote:true
··team:Platform
··title:SeniorEngineer
··years:5
-id:2
permissions:
··admin:false
··editor:true
profile:
··age:28
··city:NYC
··verified:true
status:active
-contact:
··email:c@example.com
··phone:555-0103
··preferred:email
id:3
metadata:
··created:'2019-06-10'
... (truncated)
TOON
chars: 1,766 tokens: 625 chars_og/tok: 3.8 enc_chars/tok: 2.8
<s>[10]:
-id:1
··name:Alice
··work:
····title:SeniorEngineer
····years:5
····remote:true
····team:Platform
··contact:
····email:alice@co.com
-id:2
··profile:
····age:28
····city:NYC
····verified:true
··status:active
··permissions:
····admin:false
····editor:true
-id:3
··name:Charlie
··contact:
····email:c@example.com
····preferred:email
····phone:555-0103
... (truncated)
TSON
chars: 1,275 tokens: 560 chars_og/tok: 4.3 enc_chars/tok: 2.3
<s>[{@id,name,work,contact|1,Alice,{@title,years,remote,team|"SeniorEngineer",5,true,Platform},{@email|"alice@co.com"}},{@id,profile,status,permissions|2,{@age,city,verified|28,NYC,true},active,{@admin,editor|false,true}},{@id,name,contact,metadata|3,Charlie,{@email,preferred,phone|"c@example.com",email,555-0103},{@created|2019-06-10}},{@id,user,metadata,settings|4,{@username,role,level|diana,admin,5},{@created,updated|2020-09-01,2024-01-20},{@theme|dark}},{@id,employee,performance,contact|5,{@name,department|"EveAdams",Sales},{@score,reviews|85,3},{@email,slack|"eve@co.com","@eve"}},{@id,name,work,contact|6,Frank,{@title,years,remote,team|"ProductManager",8,false,Growth},{@email,phone|"frank@co.com",555-0106}},{@id,profile,status,permissions,metadata|7,{@age,city,verified|35,LA,false},inactive,{@admin,editor|true,false},{@created|2018-03-15}},{@id,name,contact,settings|8,Grace,{@email,preferred,slack|"grace@example.org",slack,"@grace"},{@theme,notifications|light,true}},{@id,user,employee,performance|9,{@username,role,level|henry,viewer,2},{@name,department|"HenryWilson",Marketing},{@score,reviews|72,5}},{@id,name,work,profile,contact|10,Iris,{@title,years,remote,team|Designer,3,true,Creative},{@age,city,verified|26,Austin,true},{@email|"iris@co.com"}}]
minemizer
chars: 1,203 tokens: 452 chars_og/tok: 5.3 enc_chars/tok: 2.7
<s>id;name;contact{email;...}
1;Alice;{alice@co.com};work{title:SeniorEngineer;years:5;remote:true;team:Platform}
2;;;profile{age:28;city:NYC;verified:true};status:active;permissions{admin:false;editor:true}
3;Charlie;{c@example.com;preferred:email;phone:555-0103};metadata{created:2019-06-10}
4;;;user{username:diana;role:admin;level:5};metadata{created:2020-09-01;updated:2024-01-20};settings{theme:dark}
5;;{eve@co.com;slack:@eve};employee{name:EveAdams;department:Sales};performance{score:85;reviews:3}
6;Frank;{frank@co.com;phone:555-0106};work{title:ProductManager;years:8;remote:false;team:Growth}
7;;;profile{age:35;city:LA;verified:false};status:inactive;permissions{admin:true;editor:false};metadata{created:2018-03-15}
8;Grace;{grace@example.org;preferred:slack;slack:@grace};settings{theme:light;notifications:true}
9;;;user{username:henry;role:viewer;level:2};employee{name:HenryWilson;department:Marketing};performance{score:72;reviews:5}
10;Iris;{iris@co.com};work{title:Designer;years:3;remote:true;team:Creative};profile{age:26;city:Austin;verified:true}
minemizer (compact)
chars: 1,072 tokens: 462 chars_og/tok: 5.2 enc_chars/tok: 2.3
<s>id;name;contact{email;...}
1;Alice;{alice@co.com};work{title:SeniorEngineer;years:5;remote:true;team:Platform}
2;;;profile{age:28;city:NYC;verified:true};status:active;permissions{admin:false;editor:true}
3;Charlie;{c@example.com;preferred:email;phone:555-0103};metadata{created:2019-06-10}
4;;;user{username:diana;role:admin;level:5};metadata{created:2020-09-01;updated:2024-01-20};settings{theme:dark}
5;;{eve@co.com;slack:@eve};employee{name:EveAdams;department:Sales};performance{score:85;reviews:3}
6;Frank;{frank@co.com;phone:555-0106};work{title:ProductManager;years:8;remote:false;team:Growth}
7;;;profile{age:35;city:LA;verified:false};status:inactive;permissions{admin:true;editor:false};metadata{created:2018-03-15}
8;Grace;{grace@example.org;preferred:slack;slack:@grace};settings{theme:light;notifications:true}
9;;;user{username:henry;role:viewer;level:2};employee{name:HenryWilson;department:Marketing};performance{score:72;reviews:5}
10;Iris;{iris@co.com};work{title:Designer;years:3;remote:true;team:Creative};profile{age:26;city:Austin;verified:true}
large_non_uniform_nested_numerical.json — Original: 2947 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
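| Format | Chars | Tokens | chars_og/tok | enc_chars/tok |
|---|---|---|---|---|
| JSON (pretty) | 2,947 | 1,542 | 1.9 | 1.9 |
| JSON (min) | 1,873 | 976 | 3.0 | 1.9 |
| CSV | N/A | | | |
| TSV | N/A | | | |
| YAML | 2,085 | 1,171 | 2.5 | 1.8 |
| TOON | 2,318 | 1,178 | 2.5 | 2.0 |
| TSON | 1,642 | 993 | 3.0 | 1.7 |
| minemizer | 1,534 | 940 | 3.1 | 1.6 |
| minemizer (compact) | 1,361 | 875 | 3.4 | 1.6 |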
JSON (pretty)
chars: 2,947 tokens: 1,542 chars_og/tok: 1.9 enc_chars/tok: 1.9
<s>[
{
··"id":1,
··"metrics":{
····"views":15420,
····"clicks":842,
····"ctr":0.0546,
····"bounce_rate":0.32
··},
··"revenue":{
····"amount":12499.99,
····"currency_rate":1.0
··},
··"timestamp":"2024-01-15T09:30:00Z"
},
{
··"id":2,
··"metrics":{
····"views":8923,
····"clicks":156,
····"ctr":0.0175,
····"bounce_rate":0.67
··},
··"stats":{
····"avg_time":45.7,
... (truncated)
JSON (min)
chars: 1,873 tokens: 976 chars_og/tok: 3.0 enc_chars/tok: 1.9
<s>[{"id":1,"metrics":{"views":15420,"clicks":842,"ctr":0.0546,"bounce_rate":0.32},"revenue":{"amount":12499.99,"currency_rate":1.0},"timestamp":"2024-01-15T09:30:00Z"},{"id":2,"metrics":{"views":8923,"clicks":156,"ctr":0.0175,"bounce_rate":0.67},"stats":{"avg_time":45.7,"pages_per_session":2.3,"return_rate":0.15},"timestamp":"2024-01-16T14:22:33Z"},{"id":3,"revenue":{"amount":8750.5,"tax":700.04,"net":8050.46,"currency_rate":0.92},"inventory":{"count":342,"reserved":28,"available":314}},{"id":4,"metrics":{"views":52100,"clicks":3891,"ctr":0.0747,"bounce_rate":0.21},"performance":{"latency_ms":127.5,"uptime":0.9987,"errors":3},"timestamp":"2024-01-17T08:00:00Z"},{"id":5,"stats":{"avg_time":128.9,"pages_per_session":5.7,"return_rate":0.42},"scores":{"quality":94,"relevance":87,"engagement":0.78},"dates":{"start":"2023-06-01","end":"2024-01-31"}},{"id":6,"inventory":{"count":1205,"reserved":89,"available":1116,"reorder_point":200},"pricing":{"cost":24.99,"markup":0.35,"price":33.74},"timestamp":"2024-01-18T11:45:12Z"},{"id":7,"metrics":{"views":3156,"clicks":98,"ctr":0.031,"bounce_rate":0.55},"revenue":{"amount":2150.0,"tax":172.0,"net":1978.0},"performance":{"latency_ms":89.2,"uptime":0.9995,"errors":0}},{"id":8,"scores":{"quality":78,"relevance":92,"engagement":0.65,"nps":45},"dates":{"start":"2022-11-15","end":"2024-02-28","renewal":"2024-03-01"},"budget":{"allocated":50000,"spent":42350.75,"remaining":7649.25}},{"id":9,"pricing":{"cost":149.99,"markup":0.28,"price":191.99,"discount":0.1},"inventory":{"count":56,"reserved":12,"available":44},"timestamp":"2024-01-19T16:30:45Z"},{"id":10,"metrics":{"views":128750,"clicks":9823,"ctr":0.0763,"bounce_rate":0.18},"stats":{"avg_time":312.4,"pages_per_session":8.2,"return_rate":0.58},"budget":{"allocated":125000,"spent":98420.33,"remaining":26579.67},"dates":{"start":"2023-01-01","end":"2024-12-31"}}]
CSV: N/A
TSV: N/A
YAML
chars: 2,085 tokens: 1,171 chars_og/tok: 2.5 enc_chars/tok: 1.8
<s>-id:1
metrics:
··bounce_rate:0.32
··clicks:842
··ctr:0.0546
··views:15420
revenue:
··amount:12499.99
··currency_rate:1.0
timestamp:'2024-01-15T09:30:00Z'
-id:2
metrics:
··bounce_rate:0.67
··clicks:156
··ctr:0.0175
··views:8923
stats:
··avg_time:45.7
··pages_per_session:2.3
··return_rate:0.15
timestamp:'2024-01-16T14:22:33Z'
-id:3
inventory:
··available:314
··count:342
... (truncated)
TOON
chars: 2,318 tokens: 1,178 chars_og/tok: 2.5 enc_chars/tok: 2.0
<s>[10]:
-id:1
··metrics:
····views:15420
····clicks:842
····ctr:0.0546
····bounce_rate:0.32
··revenue:
····amount:12499.99
····currency_rate:1.0
··timestamp:"2024-01-15T09:30:00Z"
-id:2
··metrics:
····views:8923
····clicks:156
····ctr:0.0175
····bounce_rate:0.67
··stats:
····avg_time:45.7
····pages_per_session:2.3
····return_rate:0.15
··timestamp:"2024-01-16T14:22:33Z"
-id:3
··revenue:
····amount:8750.5
... (truncated)
TSON
chars: 1,642 tokens: 993 chars_og/tok: 3.0 enc_chars/tok: 1.7
<s>[{@id,metrics,revenue,timestamp|1,{@views,clicks,ctr,bounce_rate|15420,842,0.0546,0.32},{@amount,currency_rate|12499.99,1.0},2024-01-15T09:30:00Z},{@id,metrics,stats,timestamp|2,{@views,clicks,ctr,bounce_rate|8923,156,0.0175,0.67},{@avg_time,pages_per_session,return_rate|45.7,2.3,0.15},2024-01-16T14:22:33Z},{@id,revenue,inventory|3,{@amount,tax,net,currency_rate|8750.5,700.04,8050.46,0.92},{@count,reserved,available|342,28,314}},{@id,metrics,performance,timestamp|4,{@views,clicks,ctr,bounce_rate|52100,3891,0.0747,0.21},{@latency_ms,uptime,errors|127.5,0.9987,3},2024-01-17T08:00:00Z},{@id,stats,scores,dates|5,{@avg_time,pages_per_session,return_rate|128.9,5.7,0.42},{@quality,relevance,engagement|94,87,0.78},{@start,end|2023-06-01,2024-01-31}},{@id,inventory,pricing,timestamp|6,{@count,reserved,available,reorder_point|1205,89,1116,200},{@cost,markup,price|24.99,0.35,33.74},2024-01-18T11:45:12Z},{@id,metrics,revenue,performance|7,{@views,clicks,ctr,bounce_rate|3156,98,0.031,0.55},{@amount,tax,net|2150.0,172.0,1978.0},{@latency_ms,uptime,errors|89.2,0.9995,0}},{@id,scores,dates,budget|8,{@quality,relevance,engagement,nps|78,92,0.65,45},{@start,end,renewal|2022-11-15,2024-02-28,2024-03-01},{@allocated,spent,remaining|50000,42350.75,7649.25}},{@id,pricing,inventory,timestamp|9,{@cost,markup,price,discount|149.99,0.28,191.99,0.1},{@count,reserved,available|56,12,44},2024-01-19T16:30:45Z},{@id,metrics,stats,budget,dates|10,{@views,clicks,ctr,bounce_rate|128750,9823,0.0763,0.18},{@avg_time,pages_per_session,return_rate|312.4,8.2,0.58},{@allocated,spent,remaining|125000,98420.33,26579.67},{@start,end|2023-01-01,2024-12-31}}]
minemizer
chars: 1,534 tokens: 940 chars_og/tok: 3.1 enc_chars/tok: 1.6
<s>id;metrics{views;clicks;ctr;bounce_rate};timestamp
1;{15420;842;0.0546;0.32};2024-01-15T09:30:00Z;revenue{amount:12499.99;currency_rate:1.0}
2;{8923;156;0.0175;0.67};2024-01-16T14:22:33Z;stats{avg_time:45.7;pages_per_session:2.3;return_rate:0.15}
3;;;revenue{amount:8750.5;tax:700.04;net:8050.46;currency_rate:0.92};inventory{count:342;reserved:28;available:314}
4;{52100;3891;0.0747;0.21};2024-01-17T08:00:00Z;performance{latency_ms:127.5;uptime:0.9987;errors:3}
5;;;stats{avg_time:128.9;pages_per_session:5.7;return_rate:0.42};scores{quality:94;relevance:87;engagement:0.78};dates{start:2023-06-01;end:2024-01-31}
6;;2024-01-18T11:45:12Z;inventory{count:1205;reserved:89;available:1116;reorder_point:200};pricing{cost:24.99;markup:0.35;price:33.74}
7;{3156;98;0.031;0.55};;revenue{amount:2150.0;tax:172.0;net:1978.0};performance{latency_ms:89.2;uptime:0.9995;errors:0}
8;;;scores{quality:78;relevance:92;engagement:0.65;nps:45};dates{start:2022-11-15;end:2024-02-28;renewal:2024-03-01};budget{allocated:50000;spent:42350.75;remaining:7649.25}
9;;2024-01-19T16:30:45Z;pricing{cost:149.99;markup:0.28;price:191.99;discount:0.1};inventory{count:56;reserved:12;available:44}
10;{128750;9823;0.0763;0.18};;stats{avg_time:312.4;pages_per_session:8.2;return_rate:0.58};budget{allocated:125000;spent:98420.33;remaining:26579.67};dates{start:2023-01-01;end:2024-12-31}
minemizer (compact)
chars: 1,361 tokens: 875 chars_og/tok: 3.4 enc_chars/tok: 1.6
<s>id;metrics{views;clicks;ctr;bounce_rate};timestamp
1;{15420;842;0.0546;0.32};2024-01-15T09:30:00Z;revenue{amount:12499.99;currency_rate:1.0}
2;{8923;156;0.0175;0.67};2024-01-16T14:22:33Z;stats{avg_time:45.7;pages_per_session:2.3;return_rate:0.15}
3;;;revenue{amount:8750.5;tax:700.04;net:8050.46;currency_rate:0.92};inventory{count:342;reserved:28;available:314}
4;{52100;3891;0.0747;0.21};2024-01-17T08:00:00Z;performance{latency_ms:127.5;uptime:0.9987;errors:3}
5;;;stats{avg_time:128.9;pages_per_session:5.7;return_rate:0.42};scores{quality:94;relevance:87;engagement:0.78};dates{start:2023-06-01;end:2024-01-31}
6;;2024-01-18T11:45:12Z;inventory{count:1205;reserved:89;available:1116;reorder_point:200};pricing{cost:24.99;markup:0.35;price:33.74}
7;{3156;98;0.031;0.55};;revenue{amount:2150.0;tax:172.0;net:1978.0};performance{latency_ms:89.2;uptime:0.9995;errors:0}
8;;;scores{quality:78;relevance:92;engagement:0.65;nps:45};dates{start:2022-11-15;end:2024-02-28;renewal:2024-03-01};budget{allocated:50000;spent:42350.75;remaining:7649.25}
9;;2024-01-19T16:30:45Z;pricing{cost:149.99;markup:0.28;price:191.99;discount:0.1};inventory{count:56;reserved:12;available:44}
10;{128750;9823;0.0763;0.18};;stats{avg_time:312.4;pages_per_session:8.2;return_rate:0.58};budget{allocated:125000;spent:98420.33;remaining:26579.67};dates{start:2023-01-01;end:2024-12-31}
large_non_uniform_nested_text.json — Original: 4214 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
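| Format | Chars | Tokens | chars_og/tok | enc_chars/tok |
|---|---|---|---|---|
| JSON (pretty) | 4,214 | 1,268 | 3.3 | 3.3 |
| JSON (min) | 3,359 | 792 | 5.3 | 4.2 |
| CSV | N/A | | | |
| TSV | N/A | | | |
| YAML | 3,387 | 843 | 5.0 | 4.0 |
| TOON | 3,534 | 846 | 5.0 | 4.2 |
| TSON | 3,173 | 831 | 5.1 | 3.8 |
| minemizer | 2,809 | 619 | 6.8 | 4.5 |
| minemizer (compact) | 2,694 | 672 | 6.3 | 4.0 |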
JSON (pretty)
chars: 4,214 tokens: 1,268 chars_og/tok: 3.3 enc_chars/tok: 3.3
<s>[
{
··"id":1,
··"title":"IntroductiontoMachineLearning",
··"author":{
····"name":"Dr.SarahChen",
····"affiliation":"StanfordUniversity",
····"department":"ComputerScience"
··},
··"abstract":"Acomprehensiveoverviewofmodernmachinelearningtechniquesandapplications",
··"tags":[
····"AI",
····"ML",
····"deeplearning"
··]
},
{
··"id":2,
··"title":"ClimateChangeImpactAssessment",
··"content":{
····"summary":"Analysisofrisingsealevelsandtemperaturepatterns",
····"methodology":"longitudinalstudywithsatelliteimagery",
····"conclusion":"significantaccelerationobservedsince2010"
··},
··"category":"EnvironmentalScience"
... (truncated)
JSON (min)
chars: 3,359 tokens: 792 chars_og/tok: 5.3 enc_chars/tok: 4.2
<s>[{"id":1,"title":"IntroductiontoMachineLearning","author":{"name":"Dr.SarahChen","affiliation":"StanfordUniversity","department":"ComputerScience"},"abstract":"Acomprehensiveoverviewofmodernmachinelearningtechniquesandapplications","tags":["AI","ML","deeplearning"]},{"id":2,"title":"ClimateChangeImpactAssessment","content":{"summary":"Analysisofrisingsealevelsandtemperaturepatterns","methodology":"longitudinalstudywithsatelliteimagery","conclusion":"significantaccelerationobservedsince2010"},"category":"EnvironmentalScience"},{"id":3,"author":{"name":"MarcusWilliams","affiliation":"MITMediaLab","role":"PrincipalResearcher"},"publication":{"journal":"NatureCommunications","volume":"fifteen","status":"peer-reviewed"},"keywords":"quantumcomputing,errorcorrection,faulttolerance"},{"id":4,"title":"UrbanPlanningStrategiesforSustainableCities","abstract":"Examininggreeninfrastructureandmixed-usedevelopmentpatterns","content":{"summary":"CasestudiesfromCopenhagen,Singapore,andPortland","methodology":"comparativeanalysiswithcommunitysurveys","findings":"walkabilitycorrelatesstronglywithresidentsatisfaction"},"tags":["urbandesign","sustainability","planning"]},{"id":5,"publication":{"journal":"TheLancet","volume":"fourhundredtwo","issue":"specialedition","status":"published"},"content":{"summary":"Globalhealthoutcomesfollowingpandemicresponsemeasures","conclusion":"earlyinterventionstrategiesprovedmosteffective"},"category":"PublicHealth"},{"id":6,"title":"AdvancesinNaturalLanguageProcessing","author":{"name":"Dr.JamesRodriguez","affiliation":"GoogleResearch","department":"LanguageUnderstanding"},"abstract":"SurveyoftransformerarchitecturesandattentionmechanismsinmodernNLPsystems","keywords":"transformers,attention,languagemodels,BERT,GPT"},{"id":7,"content":{"summary":"Historicalanalysisofeconomicpolicyshiftsinemergingmarkets","methodology":"archivalresearchcombinedwitheconometricmodeling","findings":"tradeliberalizationshowedmixedresultsacrossregions","limitations":"data
availabilityconstraintsforpre-1990period"},"category":"Economics","tags":["policy","trade","development"]},{"id":8,"title":"BiodiversityConservationinTropicalRainforests","author":{"name":"Dr.AnaCosta","affiliation":"BrazilianInstituteforAmazonianResearch","role":"LeadEcologist"},"publication":{"journal":"ConservationBiology","status":"underreview"},"abstract":"Mappingspeciesdistributionpatternsandidentifyingcriticalhabitatcorridors"},{"id":9,"title":"BehavioralEconomicsandConsumerDecisionMaking","content":{"summary":"Experimentalstudiesoncognitivebiasesinpurchasingbehavior","methodology":"randomizedcontrolledtrialswitheye-trackingtechnology","conclusion":"anchoringeffectspersistevenwithexpertconsumers"},"keywords":"behavioraleconomics,decisiontheory,consumerpsychology","category":"Psychology"},{"id":10,"author":{"name":"Prof.MichaelThompson","affiliation":"OxfordUniversity","department":"EngineeringScience","role":"DepartmentChair"},"publication":{"journal":"AdvancedMaterials","volume":"thirty-six","status":"accepted"},"abstract":"Novelsynthesismethodsforhigh-performanceceramiccomposites","tags":["materialsscience","ceramics","nanotechnology"]}]
CSV: N/A
TSV: N/A
YAML
chars: 3,387 tokens: 843 chars_og/tok: 5.0 enc_chars/tok: 4.0
<s>-abstract:Acomprehensiveoverviewofmodernmachinelearningtechniquesandapplications
author:
··affiliation:StanfordUniversity
··department:ComputerScience
··name:Dr.SarahChen
id:1
tags:
-AI
-ML
-deeplearning
title:IntroductiontoMachineLearning
-category:EnvironmentalScience
content:
··conclusion:significantaccelerationobservedsince2010
··methodology:longitudinalstudywithsatelliteimagery
··summary:Analysisofrisingsealevelsandtemperaturepatterns
id:2
title:ClimateChangeImpactAssessment
-author:
··affiliation:MITMediaLab
··name:MarcusWilliams
··role:PrincipalResearcher
id:3
keywords:quantumcomputing,errorcorrection,faulttolerance
publication:
... (truncated)
TOON
chars: 3,534 tokens: 846 chars_og/tok: 5.0 enc_chars/tok: 4.2
<s>[10]:
-id:1
··title:IntroductiontoMachineLearning
··author:
····name:Dr.SarahChen
····affiliation:StanfordUniversity
····department:ComputerScience
··abstract:Acomprehensiveoverviewofmodernmachinelearningtechniquesandapplications
··tags[3]:AI,ML,deeplearning
-id:2
··title:ClimateChangeImpactAssessment
··content:
····summary:Analysisofrisingsealevelsandtemperaturepatterns
····methodology:longitudinalstudywithsatelliteimagery
····conclusion:significantaccelerationobservedsince2010
··category:EnvironmentalScience
-id:3
··author:
····name:MarcusWilliams
····affiliation:MITMediaLab
····role:PrincipalResearcher
··publication:
····journal:NatureCommunications
····volume:fifteen
····status:peer-reviewed
... (truncated)
TSON
chars: 3,173 tokens: 831 chars_og/tok: 5.1 enc_chars/tok: 3.8
<s>[{@id,title,author,abstract,tags|1,"IntroductiontoMachineLearning",{@name,affiliation,department|"Dr.SarahChen","StanfordUniversity","ComputerScience"},"Acomprehensiveoverviewofmodernmachinelearningtechniquesandapplications",[AI,ML,"deeplearning"]},{@id,title,content,category|2,"ClimateChangeImpactAssessment",{@summary,methodology,conclusion|"Analysisofrisingsealevelsandtemperaturepatterns","longitudinalstudywithsatelliteimagery","significantaccelerationobservedsince2010"},"EnvironmentalScience"},{@id,author,publication,keywords|3,{@name,affiliation,role|"MarcusWilliams","MITMediaLab","PrincipalResearcher"},{@journal,volume,status|"NatureCommunications",fifteen,peer-reviewed},"quantumcomputing,errorcorrection,faulttolerance"},{@id,title,abstract,content,tags|4,"UrbanPlanningStrategiesforSustainableCities","Examininggreeninfrastructureandmixed-usedevelopmentpatterns",{@summary,methodology,findings|"CasestudiesfromCopenhagen,Singapore,andPortland","comparativeanalysiswithcommunitysurveys","walkabilitycorrelatesstronglywithresidentsatisfaction"},["urbandesign",sustainability,planning]},{@id,publication,content,category|5,{@journal,volume,issue,status|"TheLancet","fourhundredtwo","specialedition",published},{@summary,conclusion|"Globalhealthoutcomesfollowingpandemicresponsemeasures","earlyinterventionstrategiesprovedmosteffective"},"PublicHealth"},{@id,title,author,abstract,keywords|6,"AdvancesinNaturalLanguageProcessing",{@name,affiliation,department|"Dr.JamesRodriguez","GoogleResearch","LanguageUnderstanding"},"SurveyoftransformerarchitecturesandattentionmechanismsinmodernNLPsystems","transformers,attention,languagemodels,BERT,GPT"},{@id,content,category,tags|7,{@summary,methodology,findings,limitations|"Historicalanalysisofeconomicpolicyshiftsinemergingmarkets","archivalresearchcombinedwitheconometricmodeling","tradeliberalizationshowedmixedresultsacrossregions","dataavailabilityconstraintsforpre-1990period"},Economics,[policy,trade,development]},{@id,title,author
,publication,abstract|8,"BiodiversityConservationinTropicalRainforests",{@name,affiliation,role|"Dr.AnaCosta","BrazilianInstituteforAmazonianResearch","LeadEcologist"},{@journal,status|"ConservationBiology","underreview"},"Mappingspeciesdistributionpatternsandidentifyingcriticalhabitatcorridors"},{@id,title,content,keywords,category|9,"BehavioralEconomicsandConsumerDecisionMaking",{@summary,methodology,conclusion|"Experimentalstudiesoncognitivebiasesinpurchasingbehavior","randomizedcontrolledtrialswitheye-trackingtechnology","anchoringeffectspersistevenwithexpertconsumers"},"behavioraleconomics,decisiontheory,consumerpsychology",Psychology},{@id,author,publication,abstract,tags|10,{@name,affiliation,department,role|"Prof.MichaelThompson","OxfordUniversity","EngineeringScience","DepartmentChair"},{@journal,volume,status|"AdvancedMaterials",thirty-six,accepted},"Novelsynthesismethodsforhigh-performanceceramiccomposites",["materialsscience",ceramics,nanotechnology]}]
minemizer
chars: 2,809 tokens: 619 chars_og/tok: 6.8 enc_chars/tok: 4.5
<s>id;title;author{name;affiliation;department;role};abstract;content{summary;methodology;conclusion;...}
1;IntroductiontoMachineLearning;{Dr.SarahChen;StanfordUniversity;ComputerScience;};Acomprehensiveoverviewofmodernmachinelearningtechniquesandapplications;;tags[AI;ML;deeplearning]
2;ClimateChangeImpactAssessment;;;{Analysisofrisingsealevelsandtemperaturepatterns;longitudinalstudywithsatelliteimagery;significantaccelerationobservedsince2010};category:EnvironmentalScience
3;;{MarcusWilliams;MITMediaLab;;PrincipalResearcher};;;publication{journal:NatureCommunications;volume:fifteen;status:peer-reviewed};keywords:quantumcomputing,errorcorrection,faulttolerance
4;UrbanPlanningStrategiesforSustainableCities;;Examininggreeninfrastructureandmixed-usedevelopmentpatterns;{CasestudiesfromCopenhagen,Singapore,andPortland;comparativeanalysiswithcommunitysurveys;;findings:walkabilitycorrelatesstronglywithresidentsatisfaction};tags[urbandesign;sustainability;planning]
5;;;;{Globalhealthoutcomesfollowingpandemicresponsemeasures;;earlyinterventionstrategiesprovedmosteffective};publication{journal:TheLancet;volume:fourhundredtwo;issue:specialedition;status:published};category:PublicHealth
6;AdvancesinNaturalLanguageProcessing;{Dr.JamesRodriguez;GoogleResearch;LanguageUnderstanding;};SurveyoftransformerarchitecturesandattentionmechanismsinmodernNLPsystems;;keywords:transformers,attention,languagemodels,BERT,GPT
7;;;;{Historicalanalysisofeconomicpolicyshiftsinemergingmarkets;archivalresearchcombinedwitheconometricmodeling;;findings:tradeliberalizationshowedmixedresultsacrossregions;limitations:dataavailabilityconstraintsforpre-1990period};category:Economics;tags[policy;trade;development]
8;BiodiversityConservationinTropicalRainforests;{Dr.AnaCosta;BrazilianInstituteforAmazonianResearch;;LeadEcologist};Mappingspeciesdistributionpatternsandidentifyingcriticalhabitatcorridors;;publication{journal:ConservationBiology;status:underreview}
9;BehavioralEconomicsandConsumerDecisionMaking;;;{Experimentalstudiesoncognitivebiasesinpurchasingbehavior;randomizedcontrolledtrialswitheye-trackingtechnology;anchoringeffectspersistevenwithexpertconsumers};keywords:behavioraleconomics,decisiontheory,consumerpsychology;category:Psychology
10;;{Prof.MichaelThompson;OxfordUniversity;EngineeringScience;DepartmentChair};Novelsynthesismethodsforhigh-performanceceramiccomposites;;publication{journal:AdvancedMaterials;volume:thirty-six;status:accepted};tags[materialsscience;ceramics;nanotechnology]
minemizer (compact)
chars: 2,694 tokens: 672 chars_og/tok: 6.3 enc_chars/tok: 4.0
<s>id;title;author{name;affiliation;department;role};abstract;content{summary;methodology;conclusion;...}
1;IntroductiontoMachineLearning;{Dr.SarahChen;StanfordUniversity;ComputerScience;};Acomprehensiveoverviewofmodernmachinelearningtechniquesandapplications;;tags[AI;ML;deeplearning]
2;ClimateChangeImpactAssessment;;;{Analysisofrisingsealevelsandtemperaturepatterns;longitudinalstudywithsatelliteimagery;significantaccelerationobservedsince2010};category:EnvironmentalScience
3;;{MarcusWilliams;MITMediaLab;;PrincipalResearcher};;;publication{journal:NatureCommunications;volume:fifteen;status:peer-reviewed};keywords:quantumcomputing,errorcorrection,faulttolerance
4;UrbanPlanningStrategiesforSustainableCities;;Examininggreeninfrastructureandmixed-usedevelopmentpatterns;{CasestudiesfromCopenhagen,Singapore,andPortland;comparativeanalysiswithcommunitysurveys;;findings:walkabilitycorrelatesstronglywithresidentsatisfaction};tags[urbandesign;sustainability;planning]
5;;;;{Globalhealthoutcomesfollowingpandemicresponsemeasures;;earlyinterventionstrategiesprovedmosteffective};publication{journal:TheLancet;volume:fourhundredtwo;issue:specialedition;status:published};category:PublicHealth
6;AdvancesinNaturalLanguageProcessing;{Dr.JamesRodriguez;GoogleResearch;LanguageUnderstanding;};SurveyoftransformerarchitecturesandattentionmechanismsinmodernNLPsystems;;keywords:transformers,attention,languagemodels,BERT,GPT
7;;;;{Historicalanalysisofeconomicpolicyshiftsinemergingmarkets;archivalresearchcombinedwitheconometricmodeling;;findings:tradeliberalizationshowedmixedresultsacrossregions;limitations:dataavailabilityconstraintsforpre-1990period};category:Economics;tags[policy;trade;development]
8;BiodiversityConservationinTropicalRainforests;{Dr.AnaCosta;BrazilianInstituteforAmazonianResearch;;LeadEcologist};Mappingspeciesdistributionpatternsandidentifyingcriticalhabitatcorridors;;publication{journal:ConservationBiology;status:underreview}
9;BehavioralEconomicsandConsumerDecisionMaking;;;{Experimentalstudiesoncognitivebiasesinpurchasingbehavior;randomizedcontrolledtrialswitheye-trackingtechnology;anchoringeffectspersistevenwithexpertconsumers};keywords:behavioraleconomics,decisiontheory,consumerpsychology;category:Psychology
10;;{Prof.MichaelThompson;OxfordUniversity;EngineeringScience;DepartmentChair};Novelsynthesismethodsforhigh-performanceceramiccomposites;;publication{journal:AdvancedMaterials;volume:thirty-six;status:accepted};tags[materialsscience;ceramics;nanotechnology]
mcp_tools_list.json — Original: 51663 chars — Tokenizer: llama (NousResearch/Llama-2-7b-hf)
Format | Chars | Tokens | chars_og/tok | enc_chars/tok
JSON (pretty) | 51,663 | 13,539 | 3.8 | 3.8
JSON (min) | 30,724 | 7,315 | 7.1 | 4.2
CSV | N/A
TSV | N/A
YAML | 38,139 | 8,915 | 5.8 | 4.3
TOON | 38,376 | 8,649 | 6.0 | 4.4
TSON | 25,878 | 7,045 | 7.3 | 3.7
minemizer | 23,383 | 5,767 | 9.0 | 4.1
minemizer (compact) | 21,912 | 5,726 | 9.0 | 3.8
JSON (pretty)
chars: 51,663 tokens: 13,539 chars_og/tok: 3.8 enc_chars/tok: 3.8
<s>[
{
··"inputSchema":{
····"json":{
······"properties":{
········"body":{
··········"description":"Commentcontent",
··········"type":"string"
········},
········"issue_number":{
··········"description":"Issuenumbertocommenton",
··········"type":"number"
········},
········"owner":{
··········"description":"Repositoryowner",
··········"type":"string"
········},
········"repo":{
··········"description":"Repositoryname",
··········"type":"string"
········}
······},
······"required":[
········"owner",
········"repo",
... (truncated)
JSON (min)
chars: 30,724 tokens: 7,315 chars_og/tok: 7.1 enc_chars/tok: 4.2
<s>[{"inputSchema":{"json":{"properties":{"body":{"description":"Commentcontent","type":"string"},"issue_number":{"description":"Issuenumbertocommenton","type":"number"},"owner":{"description":"Repositoryowner","type":"string"},"repo":{"description":"Repositoryname","type":"string"}},"required":["owner","repo","issue_number","body"],"type":"object"}},"name":"add_issue_comment","description":"AddacommenttoaspecificissueinaGitHubrepository."},{"inputSchema":{"json":{"properties":{"body":{"description":"Thetextofthereviewcomment","type":"string"},"line":{"description":"Thelineoftheblobinthepullrequestdiffthatthecommentappliesto.Formulti-linecomments,thelastlineoftherange","type":"number"},"owner":{"description":"Repositoryowner","type":"string"},"path":{"description":"Therelativepathtothefilethatnecessitatesacomment","type":"string"},"pullNumber":{"description":"Pullrequestnumber","type":"number"},"repo":{"description":"Repositoryname","type":"string"},"side":{"description":"Thesideofthedifftocommenton.LEFTindicatesthepreviousstate,RIGHTindicatesthenewstate","enum":["LEFT","RIGHT"],"type":"string"},"startLine":{"description":"Formulti-linecomments,thefirstlineoftherangethatthecommentappliesto","type":"number"},"startSide":{"description":"Formulti-linecomments,thestartingsideofthediffthatthecommentappliesto.LEFTindicatesthepreviousstate,RIGHTindicatesthenewstate","enum":["LEFT","RIGHT"],"type":"string"},"subjectType":{"description":"Thelevelatwhichthecommentistargeted","enum":["FILE","LINE"],"type":"string"}},"required":["owner","repo","pullNumber","path","body","subjectType"],"type":"object"}},"name":"add_pull_request_review_comment_to_pending_review","description":"Addacommenttotherequester'slatestpendingpullrequestreview,apendingreviewneedstoalreadyexisttocallthis(checkwiththeuserifnotsure)."},{"inputSchema":{"json":{"properties":{"issueNumber":{"description":"Issuenumber","type":"number"},"owner":{"description":"Repositoryowner","type":"string"},"repo":{"description
":"Repositoryname","type":"string"}},"required":["owner","repo","issueNumber"],"type":"object"}},"name":"assign_copilot_to_issue","description":"AssignCopilottoaspecificissueinaGitHubrepository.\n\nThistoolcanhelpwiththefollowingoutcomes:\n-aPullRequestcreatedwithsourcecodechangestoresolvetheissue\n\n\nMoreinformationcanbefoundat:\n-https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot\n"},{"inputSchema":{"json":{"properties":{"body":{"description":"Reviewcommenttext","type":"string"},"commitID":{"description":"SHAofcommittoreview","type":"string"},"event":{"description":"Reviewactiontoperform","enum":["APPROVE","REQUEST_CHANGES","COMMENT"],"type":"string"},"owner":{"description":"Repositoryowner","type":"string"},"pullNumber":{"description":"Pullrequestnumber","type":"number"},"repo":{"description":"Repositoryname","type":"string"}},"required":["owner","repo","pullNumber","body","event"],"type":"object"}},"name":"create_and_submit_pull_request_review","description":"Createandsubmitareviewforapullrequestwithoutreviewcomments."},{"inputSchema":{"json":{"properties":{"branch":{"description":"Namefornewbranch","type":"string"},"from_branch":{"description":"Sourcebranch(defaultstorepodefault)","type":"string"},"owner":{"description":"Repositoryowner","type":"string"},"repo":{"description":"Repositoryname","type":"string"}},"required":["owner","repo","branch"],"type":"object"}},"name":"create_branch","description":"CreateanewbranchinaGitHubrepository"},{"inputSchema":{"json":{"properties":{"assignees":{"description":"Usernamestoassigntothisissue","items":{"type":"string"},"type":"array"},"body":{"description":"Issuebodycontent","type":"string"},"labels":{"description":"Labelstoapplytothisissue","items":{"type":"string"},"type":"array"},"milestone":{"description":"Milestonenumber","type":"number"},"owner":{"description":"Repositoryowner","type":"string"},"repo":{"description":"Repositoryname","
type":"string"},"title":{"description":"Issuetitle","type":"string"}},"required":["owner","repo","title"],"type":"object"}},"name":"create_issue","description":"CreateanewissueinaGitHubrepository."},{"inputSchema":{"json":{"properties":{"branch":{"description":"Branchtocreate/updatethefilein","type":"string"},"content":{"description":"Contentofthefile","type":"string"},"message":{"description":"Commitmessage","type":"string"},"owner":{"description":"Repositoryowner(usernameororganization)","type":"string"},"path":{"description":"Pathwheretocreate/updatethefile","type":"string"},"repo":{"description":"Repositoryname","type":"string"},"sha":{"description":"SHAoffilebeingreplaced(forupdates)","type":"string"}},"required":["ow
... (truncated)
CSV: N/A
TSV: N/A
YAML
chars: 38,139 tokens: 8,915 chars_og/tok: 5.8 enc_chars/tok: 4.3
<s>-description:AddacommenttoaspecificissueinaGitHubrepository.
inputSchema:
··json:
····properties:
······body:
········description:Commentcontent
········type:string
······issue_number:
········description:Issuenumbertocommenton
········type:number
······owner:
········description:Repositoryowner
········type:string
······repo:
········description:Repositoryname
········type:string
····required:
····-owner
····-repo
····-issue_number
····-body
····type:object
name:add_issue_comment
-description:Addacommenttotherequester'slatestpendingpullrequestreview,
··apendingreviewneedstoalreadyexisttocallthis(checkwiththeuserifnot
... (truncated)
TOON
chars: 38,376 tokens: 8,649 chars_og/tok: 6.0 enc_chars/tok: 4.4
<s>[51]:
-
··inputSchema:
····json:
······properties:
········body:
··········description:Commentcontent
··········type:string
········issue_number:
··········description:Issuenumbertocommenton
··········type:number
········owner:
··········description:Repositoryowner
··········type:string
········repo:
··········description:Repositoryname
··········type:string
······required[4]:owner,repo,issue_number,body
······type:object
··name:add_issue_comment
··description:AddacommenttoaspecificissueinaGitHubrepository.
-
··inputSchema:
····json:
······properties:
... (truncated)
TSON
chars: 25,878 tokens: 7,045 chars_og/tok: 7.3 enc_chars/tok: 3.7
<s>{@inputSchema(@json),name,description#51|{{@properties,required,type|{@body,issue_number,owner,repo|{@description,type|"Commentcontent",string},{@description,type|"Issuenumbertocommenton",number},{@description,type|"Repositoryowner",string},{@description,type|"Repositoryname",string}},[owner,repo,issue_number,body],object}},add_issue_comment,"AddacommenttoaspecificissueinaGitHubrepository."|{{@properties,required,type|{@body,line,owner,path,pullNumber,repo,side,startLine,startSide,subjectType|{@description,type|"Thetextofthereviewcomment",string},{@description,type|"Thelineoftheblobinthepullrequestdiffthatthecommentappliesto.Formulti-linecomments,thelastlineoftherange",number},{@description,type|"Repositoryowner",string},{@description,type|"Therelativepathtothefilethatnecessitatesacomment",string},{@description,type|"Pullrequestnumber",number},{@description,type|"Repositoryname",string},{@description,enum,type|"Thesideofthedifftocommenton.LEFTindicatesthepreviousstate,RIGHTindicatesthenewstate",[LEFT,RIGHT],string},{@description,type|"Formulti-linecomments,thefirstlineoftherangethatthecommentappliesto",number},{@description,enum,type|"Formulti-linecomments,thestartingsideofthediffthatthecommentappliesto.LEFTindicatesthepreviousstate,RIGHTindicatesthenewstate",[LEFT,RIGHT],string},{@description,enum,type|"Thelevelatwhichthecommentistargeted",[FILE,LINE],string}},[owner,repo,pullNumber,path,body,subjectType],object}},add_pull_request_review_comment_to_pending_review,"Addacommenttotherequester'slatestpendingpullrequestreview,apendingreviewneedstoalreadyexisttocallthis(checkwiththeuserifnotsure)."|{{@properties,required,type|{@issueNumber,owner,repo|{@description,type|"Issuenumber",number},{@description,type|"Repositoryowner",string},{@description,type|"Repositoryname",string}},[owner,repo,issueNumber],object}},assign_copilot_to_issue,"AssignCopilottoaspecificissueinaGitHubrepository.\n\nThistoolcanhelpwiththefollowingoutcomes:\n-aPullRequestcreatedwithsourcecodechan
gestoresolvetheissue\n\n\nMoreinformationcanbefoundat:\n-https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot\n"|{{@properties,required,type|{@body,commitID,event,owner,pullNumber,repo|{@description,type|"Reviewcommenttext",string},{@description,type|"SHAofcommittoreview",string},{@description,enum,type|"Reviewactiontoperform",[APPROVE,REQUEST_CHANGES,COMMENT],string},{@description,type|"Repositoryowner",string},{@description,type|"Pullrequestnumber",number},{@description,type|"Repositoryname",string}},[owner,repo,pullNumber,body,event],object}},create_and_submit_pull_request_review,"Createandsubmitareviewforapullrequestwithoutreviewcomments."|{{@properties,required,type|{@branch,from_branch,owner,repo|{@description,type|"Namefornewbranch",string},{@description,type|"Sourcebranch(defaultstorepodefault)",string},{@description,type|"Repositoryowner",string},{@description,type|"Repositoryname",string}},[owner,repo,branch],object}},create_branch,"CreateanewbranchinaGitHubrepository"|{{@properties,required,type|{@assignees,body,labels,milestone,owner,repo,title|{@description,items,type|"Usernamestoassigntothisissue",{@type|string},array},{@description,type|"Issuebodycontent",string},{@description,items,type|"Labelstoapplytothisissue",{@type|string},array},{@description,type|"Milestonenumber",number},{@description,type|"Repositoryowner",string},{@description,type|"Repositoryname",string},{@description,type|"Issuetitle",string}},[owner,repo,title],object}},create_issue,"CreateanewissueinaGitHubrepository."|{{@properties,required,type|{@branch,content,message,owner,path,repo,sha|{@description,type|"Branchtocreate/updatethefilein",string},{@description,type|"Contentofthefile",string},{@description,type|"Commitmessage",string},{@description,type|"Repositoryowner(usernameororganization)",string},{@description,type|"Pathwheretocreate/updatethefile",string},{@description,type|"Repositoryname",string}
,{@description,type|"SHAoffilebeingreplaced(forupdates)",string}},[owner,repo,path,content,message,branch],object}},create_or_update_file,"CreateorupdateasinglefileinaGitHubrepository.Ifupdating,youmustprovidetheSHAofthefileyouwanttoupdate."|{{@properties,required,type|{@commitID,owner,pullNumber,repo|{@description,type|"SHAofcommittoreview",string},{@description,type|"Repositoryowner",string},{@description,type|"Pullrequestnumber",number},{@description,type|"Repositoryname",string}},[owner,repo,pullNumber],object}},create_pending_pull_request_review,"Createapendingreviewforapullrequest.Callthisfirstbeforeattemptingtoaddcommentstoapendingreview,andultimatelysubmittingit
... (truncated)
minemizer
chars: 23,383 tokens: 5,767 chars_og/tok: 9.0 enc_chars/tok: 4.1
<s>inputSchema{json{properties{owner{description;type};repo{description;type};...};required[];type}};name;description
{{{{Repositoryowner;string};{Repositoryname;string};body:{description:Commentcontent;type:string};issue_number:{description:Issuenumbertocommenton;type:number}};[owner;repo;issue_number;body];object}};add_issue_comment;AddacommenttoaspecificissueinaGitHubrepository.
{{{{Repositoryowner;string};{Repositoryname;string};body:{description:Thetextofthereviewcomment;type:string};line:{description:Thelineoftheblobinthepullrequestdiffthatthecommentappliesto.Formulti-linecomments,thelastlineoftherange;type:number};path:{description:Therelativepathtothefilethatnecessitatesacomment;type:string};pullNumber:{description:Pullrequestnumber;type:number};side:{description:Thesideofthedifftocommenton.LEFTindicatesthepreviousstate,RIGHTindicatesthenewstate;enum:[LEFT;RIGHT];type:string};startLine:{description:Formulti-linecomments,thefirstlineoftherangethatthecommentappliesto;type:number};startSide:{description:Formulti-linecomments,thestartingsideofthediffthatthecommentappliesto.LEFTindicatesthepreviousstate,RIGHTindicatesthenewstate;enum:[LEFT;RIGHT];type:string};subjectType:{description:Thelevelatwhichthecommentistargeted;enum:[FILE;LINE];type:string}};[owner;repo;pullNumber;path;body;subjectType];object}};add_pull_request_review_comment_to_pending_review;Addacommenttotherequester'slatestpendingpullrequestreview,apendingreviewneedstoalreadyexisttocallthis(checkwiththeuserifnotsure).
{{{{Repositoryowner;string};{Repositoryname;string};issueNumber:{description:Issuenumber;type:number}};[owner;repo;issueNumber];object}};assign_copilot_to_issue;AssignCopilottoaspecificissueinaGitHubrepository.

Thistoolcanhelpwiththefollowingoutcomes:
-aPullRequestcreatedwithsourcecodechangestoresolvetheissue


Moreinformationcanbefoundat:
-https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot

{{{{Repositoryowner;string};{Repositoryname;string};body:{description:Reviewcommenttext;type:string};commitID:{description:SHAofcommittoreview;type:string};event:{description:Reviewactiontoperform;enum:[APPROVE;REQUEST_CHANGES;COMMENT];type:string};pullNumber:{description:Pullrequestnumber;type:number}};[owner;repo;pullNumber;body;event];object}};create_and_submit_pull_request_review;Createandsubmitareviewforapullrequestwithoutreviewcomments.
{{{{Repositoryowner;string};{Repositoryname;string};branch:{description:Namefornewbranch;type:string};from_branch:{description:Sourcebranch(defaultstorepodefault);type:string}};[owner;repo;branch];object}};create_branch;CreateanewbranchinaGitHubrepository
{{{{Repositoryowner;string};{Repositoryname;string};assignees:{description:Usernamestoassigntothisissue;items:{type:string};type:array};body:{description:Issuebodycontent;type:string};labels:{description:Labelstoapplytothisissue;items:{type:string};type:array};milestone:{description:Milestonenumber;type:number};title:{description:Issuetitle;type:string}};[owner;repo;title];object}};create_issue;CreateanewissueinaGitHubrepository.
{{{{Repositoryowner(usernameororganization);string};{Repositoryname;string};branch:{description:Branchtocreate/updatethefilein;type:string};content:{description:Contentofthefile;type:string};message:{description:Commitmessage;type:string};path:{description:Pathwheretocreate/updatethefile;type:string};sha:{description:SHAoffilebeingreplaced(forupdates);type:string}};[owner;repo;path;content;message;branch];object}};create_or_update_file;CreateorupdateasinglefileinaGitHubrepository.Ifupdating,youmustprovidetheSHAofthefileyouwanttoupdate.
{{{{Repositoryowner;string};{Repositoryname;string};commitID:{description:SHAofcommittoreview;type:string};pullNumber:{description:Pullrequestnumber;type:number}};[owner;repo;pullNumber];object}};create_pending_pull_request_review;Createapendingreviewforapullrequest.Callthisfirstbeforeattemptingtoaddcommentstoapendingreview,andultimatelysubmittingit.Apendingpullrequestreviewmeansapullrequestreview,itispendingbecauseyoucreateitfirstandsubmititlater,andthePRauthorwillnotseeituntilitissubmitted.
{{{{Repositoryowner;string};{Repositoryname;string};base:{description:Branchtomergeinto;type:string};body:{description:PRdescription;type:string};draft:{description:CreateasdraftPR;type:boolean};head:{description:Branchcontainingchanges;type:string};maintainer_can_modify:{description:Allowmaintaineredits;type:boolean};title:{description:PRtitle;type:string}};[owner;repo;title;head;base];object}};create_pull_request;CreateanewpullrequestinaGitHubrepository.
{{{;;autoInit:{description:InitializewithREADME;type:boolean};description:{description:Repositorydescription;type:string};name:{description:Repositoryname;type:string};private:{description:Whetherreposhouldbeprivate;type:boolean}};[name];object}};create_repository;CreateanewGitHubrepositoryinyouraccount
{{{{Repositoryowner(usernameororganization);string};{Repositoryname;string};branch:{description:Branchtodeletethefilefrom;type:string};message:{description:Commitmessage;type:string};path:{description:Pathtothefiletodelete;type:string}};[owner;repo;path;message;branch];object}};delete_file;DeleteafilefromaGitHubrepository
{{{{Repositoryowner;string};{Repositoryname;string};pullNumber:{description:Pullrequestnumber;type:number}};[owner;repo;pullNumber];object}};delete_pending_pull_request_review;Deletetherequester'slatestpendingpullrequestreview.Usethisaftertheuserdecidesnottosubmitapendingreview,ifyoudon'tknowiftheyalreadycreatedonethencheckfirst.
{{{;;state:{description:Thenewstateofthenotification(read/done);enum:[read;done];type:string};threadID:{description:TheIDofthenotificationthread;type:string}};[threadID];object}};dismiss_notification;Dismissanotificationbymarkingitasreadordone
{{{{Repositoryowner;string};{Repositoryname;string};organization:{description:Organizationtoforkto;type:string}};[owner;repo];object}};fork_repository;ForkaGitHubrepositorytoyouraccountorspecifiedorganization
{{{{Theowneroftherepository.;string};{Thenameoftherepository.;string};alertNumber:{description:Thenumberofthealert.;type:number}};[owner;repo;alertNumber];object}};get_code_scanning_alert;GetdetailsofaspecificcodescanningalertinaGitHubrepository.
{{{{Repositoryowner;string};{Repositoryname;string};page:{description:Pagenumberforpagination(min1);minimum:1;type:number};perPage:{description:Resultsperpageforpagination(min1,max100);maximum:100;minimum:1;type:number};sha:{description:CommitSHA,branchname,ortagname;type:string}};[owner;repo;sha];object}};get_commit;GetdetailsforacommitfromaGitHubrepository
... (truncated)
minemizer (compact)
chars: 21,912 tokens: 5,726 chars_og/tok: 9.0 enc_chars/tok: 3.8
<s>inputSchema{json{properties{owner{description;type};repo{description;type};...};required[];type}};name;description
{{{{Repositoryowner;string};{Repositoryname;string};body:{description:Commentcontent;type:string};issue_number:{description:Issuenumbertocommenton;type:number}};[owner;repo;issue_number;body];object}};add_issue_comment;AddacommenttoaspecificissueinaGitHubrepository.
{{{{Repositoryowner;string};{Repositoryname;string};body:{description:Thetextofthereviewcomment;type:string};line:{description:Thelineoftheblobinthepullrequestdiffthatthecommentappliesto.Formulti-linecomments,thelastlineoftherange;type:number};path:{description:Therelativepathtothefilethatnecessitatesacomment;type:string};pullNumber:{description:Pullrequestnumber;type:number};side:{description:Thesideofthedifftocommenton.LEFTindicatesthepreviousstate,RIGHTindicatesthenewstate;enum:[LEFT;RIGHT];type:string};startLine:{description:Formulti-linecomments,thefirstlineoftherangethatthecommentappliesto;type:number};startSide:{description:Formulti-linecomments,thestartingsideofthediffthatthecommentappliesto.LEFTindicatesthepreviousstate,RIGHTindicatesthenewstate;enum:[LEFT;RIGHT];type:string};subjectType:{description:Thelevelatwhichthecommentistargeted;enum:[FILE;LINE];type:string}};[owner;repo;pullNumber;path;body;subjectType];object}};add_pull_request_review_comment_to_pending_review;Addacommenttotherequester'slatestpendingpullrequestreview,apendingreviewneedstoalreadyexisttocallthis(checkwiththeuserifnotsure).
{{{{Repositoryowner;string};{Repositoryname;string};issueNumber:{description:Issuenumber;type:number}};[owner;repo;issueNumber];object}};assign_copilot_to_issue;AssignCopilottoaspecificissueinaGitHubrepository.

Thistoolcanhelpwiththefollowingoutcomes:
-aPullRequestcreatedwithsourcecodechangestoresolvetheissue


Moreinformationcanbefoundat:
-https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot

{{{{Repositoryowner;string};{Repositoryname;string};body:{description:Reviewcommenttext;type:string};commitID:{description:SHAofcommittoreview;type:string};event:{description:Reviewactiontoperform;enum:[APPROVE;REQUEST_CHANGES;COMMENT];type:string};pullNumber:{description:Pullrequestnumber;type:number}};[owner;repo;pullNumber;body;event];object}};create_and_submit_pull_request_review;Createandsubmitareviewforapullrequestwithoutreviewcomments.
{{{{Repositoryowner;string};{Repositoryname;string};branch:{description:Namefornewbranch;type:string};from_branch:{description:Sourcebranch(defaultstorepodefault);type:string}};[owner;repo;branch];object}};create_branch;CreateanewbranchinaGitHubrepository
{{{{Repositoryowner;string};{Repositoryname;string};assignees:{description:Usernamestoassigntothisissue;items:{type:string};type:array};body:{description:Issuebodycontent;type:string};labels:{description:Labelstoapplytothisissue;items:{type:string};type:array};milestone:{description:Milestonenumber;type:number};title:{description:Issuetitle;type:string}};[owner;repo;title];object}};create_issue;CreateanewissueinaGitHubrepository.
{{{{Repositoryowner(usernameororganization);string};{Repositoryname;string};branch:{description:Branchtocreate/updatethefilein;type:string};content:{description:Contentofthefile;type:string};message:{description:Commitmessage;type:string};path:{description:Pathwheretocreate/updatethefile;type:string};sha:{description:SHAoffilebeingreplaced(forupdates);type:string}};[owner;repo;path;content;message;branch];object}};create_or_update_file;CreateorupdateasinglefileinaGitHubrepository.Ifupdating,youmustprovidetheSHAofthefileyouwanttoupdate.
{{{{Repositoryowner;string};{Repositoryname;string};commitID:{description:SHAofcommittoreview;type:string};pullNumber:{description:Pullrequestnumber;type:number}};[owner;repo;pullNumber];object}};create_pending_pull_request_review;Createapendingreviewforapullrequest.Callthisfirstbeforeattemptingtoaddcommentstoapendingreview,andultimatelysubmittingit.Apendingpullrequestreviewmeansapullrequestreview,itispendingbecauseyoucreateitfirstandsubmititlater,andthePRauthorwillnotseeituntilitissubmitted.
{{{{Repositoryowner;string};{Repositoryname;string};base:{description:Branchtomergeinto;type:string};body:{description:PRdescription;type:string};draft:{description:CreateasdraftPR;type:boolean};head:{description:Branchcontainingchanges;type:string};maintainer_can_modify:{description:Allowmaintaineredits;type:boolean};title:{description:PRtitle;type:string}};[owner;repo;title;head;base];object}};create_pull_request;CreateanewpullrequestinaGitHubrepository.
{{{;;autoInit:{description:InitializewithREADME;type:boolean};description:{description:Repositorydescription;type:string};name:{description:Repositoryname;type:string};private:{description:Whetherreposhouldbeprivate;type:boolean}};[name];object}};create_repository;CreateanewGitHubrepositoryinyouraccount
{{{{Repositoryowner(usernameororganization);string};{Repositoryname;string};branch:{description:Branchtodeletethefilefrom;type:string};message:{description:Commitmessage;type:string};path:{description:Pathtothefiletodelete;type:string}};[owner;repo;path;message;branch];object}};delete_file;DeleteafilefromaGitHubrepository
{{{{Repositoryowner;string};{Repositoryname;string};pullNumber:{description:Pullrequestnumber;type:number}};[owner;repo;pullNumber];object}};delete_pending_pull_request_review;Deletetherequester'slatestpendingpullrequestreview.Usethisaftertheuserdecidesnottosubmitapendingreview,ifyoudon'tknowiftheyalreadycreatedonethencheckfirst.
{{{;;state:{description:Thenewstateofthenotification(read/done);enum:[read;done];type:string};threadID:{description:TheIDofthenotificationthread;type:string}};[threadID];object}};dismiss_notification;Dismissanotificationbymarkingitasreadordone
{{{{Repositoryowner;string};{Repositoryname;string};organization:{description:Organizationtoforkto;type:string}};[owner;repo];object}};fork_repository;ForkaGitHubrepositorytoyouraccountorspecifiedorganization
{{{{Theowneroftherepository.;string};{Thenameoftherepository.;string};alertNumber:{description:Thenumberofthealert.;type:number}};[owner;repo;alertNumber];object}};get_code_scanning_alert;GetdetailsofaspecificcodescanningalertinaGitHubrepository.
{{{{Repositoryowner;string};{Repositoryname;string};page:{description:Pagenumberforpagination(min1);minimum:1;type:number};perPage:{description:Resultsperpageforpagination(min1,max100);maximum:100;minimum:1;type:number};sha:{description:CommitSHA,branchname,ortagname;type:string}};[owner;repo;sha];object}};get_commit;GetdetailsforacommitfromaGitHubrepository
... (truncated)
simple_flat.json — Original: 763 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
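Format | Chars | Tokens | chars_og/tok | enc_chars/tok
JSON (pretty) | 763 | 264 | 2.9 | 2.9
JSON (min) | 522 | 137 | 5.6 | 3.8
CSV | 234 | 77 | 9.9 | 3.0
TSV | 234 | 77 | 9.9 | 3.0
YAML | 489 | 169 | 4.5 | 2.9
TOON | 246 | 96 | 7.9 | 2.6
TSON | 229 | 80 | 9.5 | 2.9
minemizer | 251 | 72 | 10.6 | 3.5
minemizer (compact) | 224 | 77 | 9.9 | 2.9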
JSON (pretty)
chars: 763 tokens: 264 chars_og/tok: 2.9 enc_chars/tok: 2.9
[↵
· {↵
··· "id":·1,↵
··· "name": "Alice",↵
··· "role": "Engineer",↵
··· "department": "Backend"↵
· },↵
· {↵
··· "id":·2,↵
··· "name": "Bob",↵
··· "role": "Designer",↵
··· "department": "Frontend"↵
· },↵
· {↵
··· "id":·3,↵
··· "name": "Carol",↵
··· "role": "Manager",↵
··· "department": "Product"↵
· },↵
· {↵
··· "id":·4,↵
··· "name": "David",↵
··· "role": "Engineer",↵
··· "department": "Infrastructure"↵
· },
... (truncated)
JSON (min)
chars: 522 tokens: 137 chars_og/tok: 5.6 enc_chars/tok: 3.8
[{"id":1,"name":"Alice","role":"Engineer","department":"Backend"},{"id":2,"name":"Bob","role":"Designer","department":"Frontend"},{"id":3,"name":"Carol","role":"Manager","department":"Product"},{"id":4,"name":"David","role":"Engineer","department":"Infrastructure"},{"id":5,"name":"Eva","role":"Analyst","department":"Data"},{"id":6,"name":"Frank","role":"Engineer","department":"Backend"},{"id":7,"name":"Grace","role":"Designer","department":"Mobile"},{"id":8,"name":"Henry","role":"Manager","department":"Engineering"}]
CSV
chars: 234 tokens: 77 chars_og/tok: 9.9 enc_chars/tok: 3.0
id,name,role,department
1,Alice,Engineer,Backend
2,Bob,Designer,Frontend
3,Carol,Manager,Product
4,David,Engineer,Infrastructure
5,Eva,Analyst,Data
6,Frank,Engineer,Backend
7,Grace,Designer,Mobile
8,Henry,Manager,Engineering
TSV
chars: 234 tokens: 77 chars_og/tok: 9.9 enc_chars/tok: 3.0
id nameroledepartment
1 AliceEngineerBackend
2 BobDesigner Frontend
3 CarolManagerProduct
4 DavidEngineerInfrastructure
5 EvaAnalyst Data
6 FrankEngineerBackend
7GraceDesigner Mobile
8 HenryManagerEngineering
YAML
chars: 489 tokens: 169 chars_og/tok: 4.5 enc_chars/tok: 2.9
- department: Backend
· id:·1
· name: Alice
· role: Engineer
- department: Frontend
· id:·2
· name: Bob
· role: Designer
- department: Product
· id:·3
· name: Carol
· role: Manager
- department: Infrastructure
· id:·4
· name: David
· role: Engineer
- department: Data
· id:·5
· name: Eva
· role: Analyst
- department: Backend
· id:·6
· name: Frank
· role: Engineer
- department: Mobile
... (truncated)
TOON
chars: 246 tokens: 96 chars_og/tok: 7.9 enc_chars/tok: 2.6
[8]{id,name,role,department}:↵
··1,Alice,Engineer,Backend
··2,Bob,Designer,Frontend
··3,Carol,Manager,Product
··4,David,Engineer,Infrastructure
··5,Eva,Analyst,Data
··6,Frank,Engineer,Backend
··7,Grace,Designer,Mobile
··8,Henry,Manager,Engineering
TSON
chars: 229 tokens: 80 chars_og/tok: 9.5 enc_chars/tok: 2.9
{@id,name,role,department#8|1,Alice,Engineer,Backend|2,Bob,Designer,Frontend|3,Carol,Manager,Product|4,David,Engineer,Infrastructure|5,Eva,Analyst,Data|6,Frank,Engineer,Backend|7,Grace,Designer,Mobile|8,Henry,Manager,Engineering}
minemizer
chars: 251 tokens: 72 chars_og/tok: 10.6 enc_chars/tok: 3.5
id; name; role; department
1; Alice; Engineer; Backend
2; Bob; Designer; Frontend
3; Carol; Manager; Product
4; David; Engineer; Infrastructure
5; Eva; Analyst; Data
6; Frank; Engineer; Backend
7; Grace; Designer; Mobile
8; Henry; Manager; Engineering
minemizer (compact)
chars: 224 tokens: 77 chars_og/tok: 9.9 enc_chars/tok: 2.9
id;name;role;department
1;Alice;Engineer;Backend
2;Bob;Designer;Frontend
3;Carol;Manager;Product
4;David;Engineer;Infrastructure
5;Eva;Analyst;Data
6;Frank;Engineer;Backend
7;Grace;Designer;Mobile
8;Henry;Manager;Engineering
nested_objects.json — Original: 1039 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)1,0393483.03.0
JSON (min)6181746.03.6
CSVN/A
TSVN/A
YAML6292294.52.7
TOON6752234.73.0
TSON3061109.42.8
minemizer3251218.62.7
minemizer (compact)2901178.92.5
JSON (pretty)
chars: 1,039 tokens: 348 chars_og/tok: 3.0 enc_chars/tok: 3.0
[↵
· {↵
··· "id": "u1",↵
··· "name": "Lukas",↵
··· "location": {↵
····· "office": "Kaunas HQ",↵
····· "floor":·12
··· },↵
··· "skills": [↵
····· "python",↵
····· "kubernetes"↵
··· ]↵
· },↵
· {↵
··· "id": "u2",↵
··· "name": "Emma",↵
··· "location": {↵
····· "office": "Boston Hub",↵
····· "floor":·7
··· },↵
··· "skills": [↵
····· "react",↵
····· "typescript",↵
····· "graphql"↵
··· ]
... (truncated)
JSON (min)
chars: 618 tokens: 174 chars_og/tok: 6.0 enc_chars/tok: 3.6
[{"id":"u1","name":"Lukas","location":{"office":"Kaunas HQ","floor":12},"skills":["python","kubernetes"]},{"id":"u2","name":"Emma","location":{"office":"Boston Hub","floor":7},"skills":["react","typescript","graphql"]},{"id":"u3","name":"Pierre","location":{"office":"Paris Office","floor":3},"skills":["rust"]},{"id":"u4","name":"Hana","location":{"office":"Tokyo Tower","floor":15},"skills":["go","docker"]},{"id":"u5","name":"Wei","location":{"office":"Taipei Center","floor":8},"skills":["java","spring"]},{"id":"u6","name":"Charlotte","location":{"office":"London Bridge","floor":5},"skills":["python","django"]}]
CSV: N/A
TSV: N/A
YAML
chars: 629 tokens: 229 chars_og/tok: 4.5 enc_chars/tok: 2.7
- id: u1
· location:↵
··· floor:·12
··· office: Kaunas HQ
· name: Lukas
· skills:↵
· - python
· - kubernetes
- id: u2
· location:↵
··· floor:·7
··· office: Boston Hub
· name: Emma
· skills:↵
· - react
· - typescript
· - graphql
- id: u3
· location:↵
··· floor:·3
··· office: Paris Office
· name: Pierre
· skills:↵
· - rust
- id: u4
... (truncated)
TOON
chars: 675 tokens: 223 chars_og/tok: 4.7 enc_chars/tok: 3.0
[6]:↵
· - id: u1
··· name: Lukas
··· location:↵
····· office: Kaunas HQ
····· floor:·12
··· skills[2]: python,kubernetes
· - id: u2
··· name: Emma
··· location:↵
····· office: Boston Hub
····· floor:·7
··· skills[3]: react,typescript,graphql
· - id: u3
··· name: Pierre
··· location:↵
····· office: Paris Office
····· floor:·3
··· skills[1]: rust
· - id: u4
··· name: Hana
··· location:↵
····· office: Tokyo Tower
····· floor:·15
··· skills[2]: go,docker
... (truncated)
TSON
chars: 306 tokens: 110 chars_og/tok: 9.4 enc_chars/tok: 2.8
{@id,name,location(@office,floor),skills#6|u1,Lukas,{"Kaunas HQ",12},[python,kubernetes]|u2,Emma,{"Boston Hub",7},[react,typescript,graphql]|u3,Pierre,{"Paris Office",3},[rust]|u4,Hana,{"Tokyo Tower",15},[go,docker]|u5,Wei,{"Taipei Center",8},[java,spring]|u6,Charlotte,{"London Bridge",5},[python,django]}
minemizer
chars: 325 tokens: 121 chars_og/tok: 8.6 enc_chars/tok: 2.7
id; name; location{ office; floor}; skills[]↵
u1; Lukas;{ Kaunas HQ;·12};[ python; kubernetes]↵
u2; Emma;{ Boston Hub;·7};[ react; typescript; graphql]↵
u3; Pierre;{ Paris Office;·3};[ rust]↵
u4; Hana;{ Tokyo Tower;·15};[ go; docker]↵
u5; Wei;{ Taipei Center;·8};[ java; spring]↵
u6; Charlotte;{ London Bridge;·5};[ python; django]
minemizer (compact)
chars: 290 tokens: 117 chars_og/tok: 8.9 enc_chars/tok: 2.5
id;name;location{office;floor};skills[]↵
u1;Lukas;{Kaunas HQ;12};[python;kubernetes]↵
u2;Emma;{Boston Hub;7};[react;typescript;graphql]↵
u3;Pierre;{Paris Office;3};[rust]↵
u4;Hana;{Tokyo Tower;15};[go;docker]↵
u5;Wei;{Taipei Center;8};[java;spring]↵
u6;Charlotte;{London Bridge;5};[python;django]
lists_of_primitives.json — Original: 610 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)6102172.82.8
JSON (min)3301035.93.2
CSVN/A
TSVN/A
YAML3411494.12.3
TOON3391374.52.5
TSON168659.42.6
minemizer188718.62.6
minemizer (compact)165708.72.4
JSON (pretty)
chars: 610 tokens: 217 chars_og/tok: 2.8 enc_chars/tok: 2.8
[↵
· {↵
··· "id":·1,↵
··· "name": "Alice",↵
··· "skills": [↵
····· "python",↵
····· "go",↵
····· "rust"↵
··· ]↵
· },↵
· {↵
··· "id":·2,↵
··· "name": "Bob",↵
··· "skills": [↵
····· "javascript",↵
····· "typescript"↵
··· ]↵
· },↵
· {↵
··· "id":·3,↵
··· "name": "Carol",↵
··· "skills": [↵
····· "java",↵
····· "kotlin",↵
····· "scala",
... (truncated)
JSON (min)
chars: 330 tokens: 103 chars_og/tok: 5.9 enc_chars/tok: 3.2
[{"id":1,"name":"Alice","skills":["python","go","rust"]},{"id":2,"name":"Bob","skills":["javascript","typescript"]},{"id":3,"name":"Carol","skills":["java","kotlin","scala","groovy"]},{"id":4,"name":"David","skills":["c","cpp"]},{"id":5,"name":"Eva","skills":["ruby","elixir","erlang"]},{"id":6,"name":"Frank","skills":["swift"]}]
CSV: N/A
TSV: N/A
YAML
chars: 341 tokens: 149 chars_og/tok: 4.1 enc_chars/tok: 2.3
- id:·1
· name: Alice
· skills:↵
· - python
· - go
· - rust
- id:·2
· name: Bob
· skills:↵
· - javascript
· - typescript
- id:·3
· name: Carol
· skills:↵
· - java
· - kotlin
· - scala
· - groovy
- id:·4
· name: David
· skills:↵
· - c
· - cpp
- id:·5
· name: Eva
... (truncated)
TOON
chars: 339 tokens: 137 chars_og/tok: 4.5 enc_chars/tok: 2.5
[6]:↵
· - id:·1
··· name: Alice
··· skills[3]: python,go,rust
· - id:·2
··· name: Bob
··· skills[2]: javascript,typescript
· - id:·3
··· name: Carol
··· skills[4]: java,kotlin,scala,groovy
· - id:·4
··· name: David
··· skills[2]: c,cpp
· - id:·5
··· name: Eva
··· skills[3]: ruby,elixir,erlang
· - id:·6
··· name: Frank
··· skills[1]: swift
TSON
chars: 168 tokens: 65 chars_og/tok: 9.4 enc_chars/tok: 2.6
{@id,name,skills#6|1,Alice,[python,go,rust]|2,Bob,[javascript,typescript]|3,Carol,[java,kotlin,scala,groovy]|4,David,[c,cpp]|5,Eva,[ruby,elixir,erlang]|6,Frank,[swift]}
minemizer
chars: 188 tokens: 71 chars_og/tok: 8.6 enc_chars/tok: 2.6
id; name; skills[]↵
1; Alice;[ python; go; rust]↵
2; Bob;[ javascript; typescript]↵
3; Carol;[ java; kotlin; scala; groovy]↵
4; David;[ c; cpp]↵
5; Eva;[ ruby; elixir; erlang]↵
6; Frank;[ swift]
minemizer (compact)
chars: 165 tokens: 70 chars_og/tok: 8.7 enc_chars/tok: 2.4
id;name;skills[]↵
1;Alice;[python;go;rust]↵
2;Bob;[javascript;typescript]↵
3;Carol;[java;kotlin;scala;groovy]↵
4;David;[c;cpp]↵
5;Eva;[ruby;elixir;erlang]↵
6;Frank;[swift]
sparse_data.json — Original: 611 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)6112272.72.7
JSON (min)4001215.03.3
CSVN/A
TSVN/A
YAML3841494.12.6
TOON4381593.82.8
TSON3281135.42.9
minemizer200728.52.8
minemizer (compact)180748.32.4
JSON (pretty)
chars: 611 tokens: 227 chars_og/tok: 2.7 enc_chars/tok: 2.7
[↵
· {↵
··· "id":·1,↵
··· "name": "Erik",↵
··· "department": "Engineering"↵
· },↵
· {↵
··· "id":·2,↵
··· "name": "Rachel",↵
··· "department": "Design",↵
··· "remote": true
· },↵
· {↵
··· "id":·3,↵
··· "name": "Hans"↵
· },↵
· {↵
··· "id":·4,↵
··· "name": "Kenji",↵
··· "department": "Sales",↵
··· "slack": "@kenji",↵
··· "remote": false
· },↵
· {↵
··· "id":·5,
... (truncated)
JSON (min)
chars: 400 tokens: 121 chars_og/tok: 5.0 enc_chars/tok: 3.3
[{"id":1,"name":"Erik","department":"Engineering"},{"id":2,"name":"Rachel","department":"Design","remote":true},{"id":3,"name":"Hans"},{"id":4,"name":"Kenji","department":"Sales","slack":"@kenji","remote":false},{"id":5,"name":"Mai","remote":true},{"id":6,"name":"Tom","department":"Engineering"},{"id":7,"name":"Priya","slack":"@priya","remote":true},{"id":8,"name":"Nina","department":"Marketing"}]
CSV: N/A
TSV: N/A
YAML
chars: 384 tokens: 149 chars_og/tok: 4.1 enc_chars/tok: 2.6
- department: Engineering
· id:·1
· name: Erik
- department: Design
· id:·2
· name: Rachel
· remote: true
- id:·3
· name: Hans
- department: Sales
· id:·4
· name: Kenji
· remote: false
· slack: '@kenji'↵
- id:·5
· name: Mai
· remote: true
- department: Engineering
· id:·6
· name: Tom
- id:·7
· name: Priya
· remote: true
· slack: '@priya'↵
- department: Marketing
... (truncated)
TOON
chars: 438 tokens: 159 chars_og/tok: 3.8 enc_chars/tok: 2.8
[8]:↵
· - id:·1
··· name: Erik
··· department: Engineering
· - id:·2
··· name: Rachel
··· department: Design
··· remote: true
· - id:·3
··· name: Hans
· - id:·4
··· name: Kenji
··· department: Sales
··· slack: @kenji
··· remote: false
· - id:·5
··· name: Mai
··· remote: true
· - id:·6
··· name: Tom
··· department: Engineering
· - id:·7
··· name: Priya
··· slack: @priya
··· remote: true
... (truncated)
TSON
chars: 328 tokens: 113 chars_og/tok: 5.4 enc_chars/tok: 2.9
[{@id,name,department|1,Erik,Engineering},{@id,name,department,remote|2,Rachel,Design,true},{@id,name|3,Hans},{@id,name,department,slack,remote|4,Kenji,Sales,"@kenji",false},{@id,name,remote|5,Mai,true},{@id,name,department|6,Tom,Engineering},{@id,name,slack,remote|7,Priya,"@priya",true},{@id,name,department|8,Nina,Marketing}]
minemizer
chars: 200 tokens: 72 chars_og/tok: 8.5 enc_chars/tok: 2.8
id; name; department; remote
1; Erik; Engineering
2; Rachel; Design;true
3; Hans
4; Kenji; Sales;false; slack: @kenji
5; Mai;;true
6; Tom; Engineering
7; Priya;;true; slack: @priya
8; Nina; Marketing;
minemizer (compact)
chars: 180 tokens: 74 chars_og/tok: 8.3 enc_chars/tok: 2.4
id;name;department;remote
1;Erik;Engineering
2;Rachel;Design;true
3;Hans
4;Kenji;Sales;false;slack:@kenji
5;Mai;;true
6;Tom;Engineering
7;Priya;;true;slack:@priya
8;Nina;Marketing;
complex_mixed.json — Original: 1320 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)1,3204552.92.9
JSON (min)7602465.43.1
CSVN/A
TSVN/A
YAML8183064.32.7
TOON8813044.32.9
TSON4532036.52.2
minemizer4031936.82.1
minemizer (compact)3611906.91.9
JSON (pretty)
chars: 1,320 tokens: 455 chars_og/tok: 2.9 enc_chars/tok: 2.9
[↵
· {↵
··· "id":·1,↵
··· "profile": {↵
····· "name": "Grace",↵
····· "location": {↵
······· "city": "NYC",↵
······· "country": "USA"↵
····· }↵
··· },↵
··· "tags": [↵
····· "admin",↵
····· "verified"↵
··· ],↵
··· "metadata": {↵
····· "created": "2024-01-15"↵
··· }↵
· },↵
· {↵
··· "id":·2,↵
··· "profile": {↵
····· "name": "Henry",↵
····· "location": {↵
······· "city": "London",↵
······· "country": "UK"
... (truncated)
JSON (min)
chars: 760 tokens: 246 chars_og/tok: 5.4 enc_chars/tok: 3.1
[{"id":1,"profile":{"name":"Grace","location":{"city":"NYC","country":"USA"}},"tags":["admin","verified"],"metadata":{"created":"2024-01-15"}},{"id":2,"profile":{"name":"Henry","location":{"city":"London","country":"UK"}},"tags":["user"],"metadata":{"created":"2024-02-20","updated":"2024-03-10"}},{"id":3,"profile":{"name":"Ivy","location":{"city":"Tokyo","country":"Japan"}},"tags":["moderator","verified","premium"],"metadata":{"created":"2024-01-05"}},{"id":4,"profile":{"name":"Jack","location":{"city":"Sydney","country":"Australia"}},"tags":["user","new"],"metadata":{"created":"2024-04-01"}},{"id":5,"profile":{"name":"Kate","location":{"city":"Berlin","country":"Germany"}},"tags":["admin"],"metadata":{"created":"2023-12-01","updated":"2024-02-15"}}]
CSV: N/A
TSV: N/A
YAML
chars: 818 tokens: 306 chars_og/tok: 4.3 enc_chars/tok: 2.7
- id:·1
· metadata:↵
··· created: '2024-01-15'↵
· profile:↵
··· location:↵
····· city: NYC
····· country: USA
··· name: Grace
· tags:↵
· - admin
· - verified
- id:·2
· metadata:↵
··· created: '2024-02-20'↵
··· updated: '2024-03-10'↵
· profile:↵
··· location:↵
····· city: London
····· country: UK
··· name: Henry
· tags:↵
· - user
- id:·3
· metadata:↵
··· created: '2024-01-05'
... (truncated)
TOON
chars: 881 tokens: 304 chars_og/tok: 4.3 enc_chars/tok: 2.9
[5]:↵
· - id:·1
··· profile:↵
····· name: Grace
····· location:↵
······· city: NYC
······· country: USA
··· tags[2]: admin,verified
··· metadata:↵
····· created:·2024-01-15
· - id:·2
··· profile:↵
····· name: Henry
····· location:↵
······· city: London
······· country: UK
··· tags[1]: user
··· metadata:↵
····· created:·2024-02-20
····· updated:·2024-03-10
· - id:·3
··· profile:↵
····· name: Ivy
····· location:↵
······· city: Tokyo
... (truncated)
TSON
chars: 453 tokens: 203 chars_og/tok: 6.5 enc_chars/tok: 2.2
{@id,profile(@name,location),tags,metadata#5|1,{Grace,{@city,country|NYC,USA}},[admin,verified],{@created|2024-01-15}|2,{Henry,{@city,country|London,UK}},[user],{@created,updated|2024-02-20,2024-03-10}|3,{Ivy,{@city,country|Tokyo,Japan}},[moderator,verified,premium],{@created|2024-01-05}|4,{Jack,{@city,country|Sydney,Australia}},[user,new],{@created|2024-04-01}|5,{Kate,{@city,country|Berlin,Germany}},[admin],{@created,updated|2023-12-01,2024-02-15}}
minemizer
chars: 403 tokens: 193 chars_og/tok: 6.8 enc_chars/tok: 2.1
id; profile{ name; location{ city; country}}; tags[]; metadata{ created; ...}↵
1;{ Grace;{ NYC; USA}};[ admin; verified];{·2024-01-15}↵
2;{ Henry;{ London; UK}};[ user];{·2024-02-20; updated:·2024-03-10}↵
3;{ Ivy;{ Tokyo; Japan}};[ moderator; verified; premium];{·2024-01-05}↵
4;{ Jack;{ Sydney; Australia}};[ user; new];{·2024-04-01}↵
5;{ Kate;{ Berlin; Germany}};[ admin];{·2023-12-01; updated:·2024-02-15}
minemizer (compact)
chars: 361 tokens: 190 chars_og/tok: 6.9 enc_chars/tok: 1.9
id;profile{name;location{city;country}};tags[];metadata{created;...}↵
1;{Grace;{NYC;USA}};[admin;verified];{2024-01-15}↵
2;{Henry;{London;UK}};[user];{2024-02-20;updated:2024-03-10}↵
3;{Ivy;{Tokyo;Japan}};[moderator;verified;premium];{2024-01-05}↵
4;{Jack;{Sydney;Australia}};[user;new];{2024-04-01}↵
5;{Kate;{Berlin;Germany}};[admin];{2023-12-01;updated:2024-02-15}
books.json — Original: 27902 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)27,9029,4343.03.0
JSON (min)22,5016,6374.23.4
CSV14,0714,7995.82.9
TSV14,0574,8835.72.9
YAML22,4007,6053.72.9
TOON14,2774,8665.72.9
TSON14,4484,8455.83.0
minemizer14,4584,9765.62.9
minemizer (compact)13,7534,8475.82.8
JSON (pretty)
chars: 27,902 tokens: 9,434 chars_og/tok: 3.0 enc_chars/tok: 3.0
[↵
· {↵
··· "author": "Chinua Achebe",↵
··· "country": "Nigeria",↵
··· "imageLink": "images/things-fall-apart.jpg",↵
··· "language": "English",↵
··· "link": "https://en.wikipedia.org/wiki/Things_Fall_Apart\n",↵
··· "pages":·209,↵
··· "title": "Things Fall Apart",↵
··· "year":·1958
· },↵
· {↵
··· "author": "Hans Christian Andersen",↵
··· "country": "Denmark",↵
··· "imageLink": "images/fairy-tales.jpg",↵
··· "language": "Danish",↵
··· "link": "https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",↵
··· "pages":·784,↵
··· "title": "Fairy tales",↵
··· "year":·1836
· },↵
· {↵
··· "author": "Dante Alighieri",↵
··· "country": "Italy",↵
··· "imageLink": "images/the-divine-comedy.jpg",
... (truncated)
JSON (min)
chars: 22,501 tokens: 6,637 chars_og/tok: 4.2 enc_chars/tok: 3.4
[{"author":"Chinua Achebe","country":"Nigeria","imageLink":"images/things-fall-apart.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Things_Fall_Apart\n","pages":209,"title":"Things Fall Apart","year":1958},{"author":"Hans Christian Andersen","country":"Denmark","imageLink":"images/fairy-tales.jpg","language":"Danish","link":"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n","pages":784,"title":"Fairy tales","year":1836},{"author":"Dante Alighieri","country":"Italy","imageLink":"images/the-divine-comedy.jpg","language":"Italian","link":"https://en.wikipedia.org/wiki/Divine_Comedy\n","pages":928,"title":"The Divine Comedy","year":1315},{"author":"Unknown","country":"Sumer and Akkadian Empire","imageLink":"images/the-epic-of-gilgamesh.jpg","language":"Akkadian","link":"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n","pages":160,"title":"The Epic Of Gilgamesh","year":-1700},{"author":"Unknown","country":"Achaemenid Empire","imageLink":"images/the-book-of-job.jpg","language":"Hebrew","link":"https://en.wikipedia.org/wiki/Book_of_Job\n","pages":176,"title":"The Book Of Job","year":-600},{"author":"Unknown","country":"India/Iran/Iraq/Egypt/Tajikistan","imageLink":"images/one-thousand-and-one-nights.jpg","language":"Arabic","link":"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n","pages":288,"title":"One Thousand and One Nights","year":1200},{"author":"Unknown","country":"Iceland","imageLink":"images/njals-saga.jpg","language":"Old Norse","link":"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n","pages":384,"title":"Nj\u00e1l's Saga","year":1350},{"author":"Jane Austen","country":"United Kingdom","imageLink":"images/pride-and-prejudice.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n","pages":226,"title":"Pride and Prejudice","year":1813},{"author":"Honor\u00e9 de 
Balzac","country":"France","imageLink":"images/le-pere-goriot.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n","pages":443,"title":"Le P\u00e8re Goriot","year":1835},{"author":"Samuel Beckett","country":"Republic of Ireland","imageLink":"images/molloy-malone-dies-the-unnamable.jpg","language":"French, English","link":"https://en.wikipedia.org/wiki/Molloy_(novel)\n","pages":256,"title":"Molloy, Malone Dies, The Unnamable, the trilogy","year":1952},{"author":"Giovanni Boccaccio","country":"Italy","imageLink":"images/the-decameron.jpg","language":"Italian","link":"https://en.wikipedia.org/wiki/The_Decameron\n","pages":1024,"title":"The Decameron","year":1351},{"author":"Jorge Luis Borges","country":"Argentina","imageLink":"images/ficciones.jpg","language":"Spanish","link":"https://en.wikipedia.org/wiki/Ficciones\n","pages":224,"title":"Ficciones","year":1965},{"author":"Emily Bront\u00eb","country":"United Kingdom","imageLink":"images/wuthering-heights.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Wuthering_Heights\n","pages":342,"title":"Wuthering Heights","year":1847},{"author":"Albert Camus","country":"Algeria, French Empire","imageLink":"images/l-etranger.jpg","language":"French","link":"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n","pages":185,"title":"The Stranger","year":1942},{"author":"Paul Celan","country":"Romania, France","imageLink":"images/poems-paul-celan.jpg","language":"German","link":"\n","pages":320,"title":"Poems","year":1952},{"author":"Louis-Ferdinand C\u00e9line","country":"France","imageLink":"images/voyage-au-bout-de-la-nuit.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n","pages":505,"title":"Journey to the End of the Night","year":1932},{"author":"Miguel de 
Cervantes","country":"Spain","imageLink":"images/don-quijote-de-la-mancha.jpg","language":"Spanish","link":"https://en.wikipedia.org/wiki/Don_Quixote\n","pages":1056,"title":"Don Quijote De La Mancha","year":1610},{"author":"Geoffrey Chaucer","country":"England","imageLink":"images/the-canterbury-tales.jpg","language":"English","link":"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n","pages":544,"title":"The Canterbury Tales","year":1450},{"author":"Anton Chekhov","country":"Russia","imageLink":"images/stories-of-anton-chekhov.jpg","language":"Russian","link":"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n","pages":194,"title":"Stories","year":1886},{"author":"Joseph Conrad","country":"United Kingdom","imageLink":"images/nostromo.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Nostromo\n","pages":320,"title":"Nostromo","year":1904},{"author":"Charles Dickens","country":"United Kingdom","imageLink":"images/great-expectations.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Great_Expectations\n","pages":194,"title":"Great Expectations","year":1861},{"author":"Denis Diderot","country":"France","imageLink":"images/jacques-the-fatalist.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Jacques_the_Fatalis
... (truncated)
CSV
chars: 14,071 tokens: 4,799 chars_og/tok: 5.8 enc_chars/tok: 2.9
author,country,imageLink,language,link,pages,title,year
Chinua Achebe,Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart
",209,Things Fall Apart,1958
Hans Christian Andersen,Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵
",784,Fairy tales,1836
Dante Alighieri,Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy
",928,The Divine Comedy,1315
Unknown,Sumer and Akkadian Empire,images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
",160,The Epic Of Gilgamesh,-1700
Unknown,Achaemenid Empire,images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job
",176,The Book Of Job,-600
Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
",288,One Thousand and One Nights,1200
Unknown,Iceland,images/njals-saga.jpg,Old Norse,"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
",384,Njál's Saga,1350
Jane Austen,United Kingdom,images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice
",226,Pride and Prejudice,1813
Honoré de Balzac,France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
",443,Le Père Goriot,1835
Samuel Beckett,Republic of Ireland,images/molloy-malone-dies-the-unnamable.jpg,"French, English","https://en.wikipedia.org/wiki/Molloy_(novel)↵
",256,"Molloy, Malone Dies, The Unnamable, the trilogy",1952
Giovanni Boccaccio,Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron
",1024,The Decameron,1351
Jorge Luis Borges,Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones
",224,Ficciones,1965
... (truncated)
TSV
chars: 14,057 tokens: 4,883 chars_og/tok: 5.7 enc_chars/tok: 2.9
author country imageLink language link pages titleyear
Chinua Achebe Nigeriaimages/things-fall-apart.jpgEnglish"https://en.wikipedia.org/wiki/Things_Fall_Apart
"209Things Fall Apart1958
Hans Christian Andersen Denmarkimages/fairy-tales.jpg Danish"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵
"784 Fairy tales1836
Dante Alighieri Italyimages/the-divine-comedy.jpg Italian"https://en.wikipedia.org/wiki/Divine_Comedy
"928 The Divine Comedy1315
Unknown Sumer and Akkadian Empireimages/the-epic-of-gilgamesh.jpg Akkadian"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
"160 The Epic Of Gilgamesh-1700
Unknown Achaemenid Empireimages/the-book-of-job.jpgHebrew"https://en.wikipedia.org/wiki/Book_of_Job
"176 The Book Of Job-600
UnknownIndia/Iran/Iraq/Egypt/Tajikistanimages/one-thousand-and-one-nights.jpgArabic"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
"288One Thousand and One Nights1200
Unknown Icelandimages/njals-saga.jpgOld Norse"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
"384 Njál's Saga1350
Jane AustenUnited Kingdomimages/pride-and-prejudice.jpgEnglish"https://en.wikipedia.org/wiki/Pride_and_Prejudice
"226 Pride and Prejudice1813
Honoré de Balzac Franceimages/le-pere-goriot.jpg French"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
"443Le Père Goriot1835
Samuel BeckettRepublic of Irelandimages/molloy-malone-dies-the-unnamable.jpg French, English"https://en.wikipedia.org/wiki/Molloy_(novel)↵
"256 Molloy, Malone Dies, The Unnamable, the trilogy1952
Giovanni Boccaccio Italyimages/the-decameron.jpg Italian"https://en.wikipedia.org/wiki/The_Decameron
"1024 The Decameron1351
Jorge Luis BorgesArgentinaimages/ficciones.jpg Spanish"https://en.wikipedia.org/wiki/Ficciones
"224 Ficciones1965
... (truncated)
YAML
chars: 22,400 tokens: 7,605 chars_og/tok: 3.7 enc_chars/tok: 2.9
- author: Chinua Achebe
· country: Nigeria
· imageLink: images/things-fall-apart.jpg
· language: English
· link: 'https://en.wikipedia.org/wiki/Things_Fall_Apart↵↵
··· '↵
· pages:·209
· title: Things Fall Apart
· year:·1958
- author: Hans Christian Andersen
· country: Denmark
· imageLink: images/fairy-tales.jpg
· language: Danish
· link: 'https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵↵
··· '↵
· pages:·784
· title: Fairy tales
· year:·1836
- author: Dante Alighieri
· country: Italy
· imageLink: images/the-divine-comedy.jpg
· language: Italian
· link: 'https://en.wikipedia.org/wiki/Divine_Comedy
... (truncated)
TOON
chars: 14,277 tokens: 4,866 chars_og/tok: 5.7 enc_chars/tok: 2.9
[100]{author,country,imageLink,language,link,pages,title,year}:↵
· Chinua Achebe,Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart\n",209,Things Fall Apart,1958
· Hans Christian Andersen,Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",784,Fairy tales,1836
· Dante Alighieri,Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy\n",928,The Divine Comedy,1315
· Unknown,Sumer and Akkadian Empire,images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n",160,The Epic Of Gilgamesh,-1700
· Unknown,Achaemenid Empire,images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job\n",176,The Book Of Job,-600
· Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n",288,One Thousand and One Nights,1200
· Unknown,Iceland,images/njals-saga.jpg,Old Norse,"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n",384,Njál's Saga,1350
· Jane Austen,United Kingdom,images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n",226,Pride and Prejudice,1813
· Honoré de Balzac,France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n",443,Le Père Goriot,1835
· Samuel Beckett,Republic of Ireland,images/molloy-malone-dies-the-unnamable.jpg,"French, English","https://en.wikipedia.org/wiki/Molloy_(novel)\n",256,"Molloy, Malone Dies, The Unnamable, the trilogy",1952
· Giovanni Boccaccio,Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron\n",1024,The Decameron,1351
· Jorge Luis Borges,Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones\n",224,Ficciones,1965
· Emily Brontë,United Kingdom,images/wuthering-heights.jpg,English,"https://en.wikipedia.org/wiki/Wuthering_Heights\n",342,Wuthering Heights,1847
· Albert Camus,"Algeria, French Empire",images/l-etranger.jpg,French,"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n",185,The Stranger,1942
· Paul Celan,"Romania, France",images/poems-paul-celan.jpg,German,"\n",320,Poems,1952
· Louis-Ferdinand Céline,France,images/voyage-au-bout-de-la-nuit.jpg,French,"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n",505,Journey to the End of the Night,1932
· Miguel de Cervantes,Spain,images/don-quijote-de-la-mancha.jpg,Spanish,"https://en.wikipedia.org/wiki/Don_Quixote\n",1056,Don Quijote De La Mancha,1610
· Geoffrey Chaucer,England,images/the-canterbury-tales.jpg,English,"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n",544,The Canterbury Tales,1450
· Anton Chekhov,Russia,images/stories-of-anton-chekhov.jpg,Russian,"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n",194,Stories,1886
· Joseph Conrad,United Kingdom,images/nostromo.jpg,English,"https://en.wikipedia.org/wiki/Nostromo\n",320,Nostromo,1904
· Charles Dickens,United Kingdom,images/great-expectations.jpg,English,"https://en.wikipedia.org/wiki/Great_Expectations\n",194,Great Expectations,1861
· Denis Diderot,France,images/jacques-the-fatalist.jpg,French,"https://en.wikipedia.org/wiki/Jacques_the_Fatalist\n",596,Jacques the Fatalist,1796
· Alfred Döblin,Germany,images/berlin-alexanderplatz.jpg,German,"https://en.wikipedia.org/wiki/Berlin_Alexanderplatz\n",600,Berlin Alexanderplatz,1929
· Fyodor Dostoevsky,Russia,images/crime-and-punishment.jpg,Russian,"https://en.wikipedia.org/wiki/Crime_and_Punishment\n",551,Crime and Punishment,1866
... (truncated)
TSON
chars: 14,448 tokens: 4,845 chars_og/tok: 5.8 enc_chars/tok: 3.0
{@author,country,imageLink,language,link,pages,title,year#100|"Chinua Achebe",Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart\n",209,"Things Fall Apart",1958|"Hans Christian Andersen",Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",784,"Fairy tales",1836|"Dante Alighieri",Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy\n",928,"The Divine Comedy",1315|Unknown,"Sumer and Akkadian Empire",images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n",160,"The Epic Of Gilgamesh",-1700|Unknown,"Achaemenid Empire",images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job\n",176,"The Book Of Job",-600|Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n",288,"One Thousand and One Nights",1200|Unknown,Iceland,images/njals-saga.jpg,"Old Norse","https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n",384,"Njál's Saga",1350|"Jane Austen","United Kingdom",images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n",226,"Pride and Prejudice",1813|"Honoré de Balzac",France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n",443,"Le Père Goriot",1835|"Samuel Beckett","Republic of Ireland",images/molloy-malone-dies-the-unnamable.jpg,"French, English","https://en.wikipedia.org/wiki/Molloy_(novel)\n",256,"Molloy, Malone Dies, The Unnamable, the trilogy",1952|"Giovanni Boccaccio",Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron\n",1024,"The Decameron",1351|"Jorge Luis Borges",Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones\n",224,Ficciones,1965|"Emily Brontë","United 
Kingdom",images/wuthering-heights.jpg,English,"https://en.wikipedia.org/wiki/Wuthering_Heights\n",342,"Wuthering Heights",1847|"Albert Camus","Algeria, French Empire",images/l-etranger.jpg,French,"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n",185,"The Stranger",1942|"Paul Celan","Romania, France",images/poems-paul-celan.jpg,German,"\n",320,Poems,1952|"Louis-Ferdinand Céline",France,images/voyage-au-bout-de-la-nuit.jpg,French,"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n",505,"Journey to the End of the Night",1932|"Miguel de Cervantes",Spain,images/don-quijote-de-la-mancha.jpg,Spanish,"https://en.wikipedia.org/wiki/Don_Quixote\n",1056,"Don Quijote De La Mancha",1610|"Geoffrey Chaucer",England,images/the-canterbury-tales.jpg,English,"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n",544,"The Canterbury Tales",1450|"Anton Chekhov",Russia,images/stories-of-anton-chekhov.jpg,Russian,"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n",194,Stories,1886|"Joseph Conrad","United Kingdom",images/nostromo.jpg,English,"https://en.wikipedia.org/wiki/Nostromo\n",320,Nostromo,1904|"Charles Dickens","United Kingdom",images/great-expectations.jpg,English,"https://en.wikipedia.org/wiki/Great_Expectations\n",194,"Great Expectations",1861|"Denis Diderot",France,images/jacques-the-fatalist.jpg,French,"https://en.wikipedia.org/wiki/Jacques_the_Fatalist\n",596,"Jacques the Fatalist",1796|"Alfred Döblin",Germany,images/berlin-alexanderplatz.jpg,German,"https://en.wikipedia.org/wiki/Berlin_Alexanderplatz\n",600,"Berlin Alexanderplatz",1929|"Fyodor Dostoevsky",Russia,images/crime-and-punishment.jpg,Russian,"https://en.wikipedia.org/wiki/Crime_and_Punishment\n",551,"Crime and Punishment",1866|"Fyodor Dostoevsky",Russia,images/the-idiot.jpg,Russian,"https://en.wikipedia.org/wiki/The_Idiot\n",656,"The Idiot",1869|"Fyodor Dostoevsky",Russia,images/the-possessed.jpg,Russian,"https://en.wikipedia.org/wiki/Demons_(Dostoyevsky_novel)\n",768,"The 
Possessed",1872|"Fyodor Dostoevsky",Russia,images/the-brothers-karamazov.jpg,Russian,"https://en.wikipedia.org/wiki/The_Brothers_Karamazov\n",824,"The Brothers Karamazov",1880|"George Eliot","United Kingdom",images/middlemarch.jpg,English,"https://en.wikipedia.org/wiki/Middlemarch\n",800,Middlemarch,1871|"Ralph Ellison","United States",images/invisible-man.jpg,English,"https://en.wikipedia.org/wiki/Invisible_Man\n",581,"Invisible Man",1952|Euripides,Greece,images/medea.jpg,Greek,"https://en.wikipedia.org/wiki/Medea_(play)\n",104,Medea,-431|"William Faulkner","United States",images/absalom-absalom.jpg,English,"https://en.wikipedia.org/wiki/Absalom,_Absalom!\n",313,"Absalom, Absalom!",1936|"William Faulkner","United States",images/the-sound-and-the-fury.jpg,English,"https://en.wikipedia.org/wiki/The_Sound_and_the_Fury\n",326,"The Sound and the Fury",1929|"Gustave Flaubert",France,images/madame-bovary.jpg,French,"https://en.wikipedia.org/wiki/Madame_Bovary\n",528,"Madame Bovary",1857|"Gustave Flaubert",France,images/l-education-sentimentale.jpg,French,"https://en.wikipedia.org/wiki/Sen
... (truncated)
minemizer
chars: 14,458 tokens: 4,976 chars_og/tok: 5.6 enc_chars/tok: 2.9
author; country; imageLink; language; link; pages; title; year
Chinua Achebe; Nigeria; images/things-fall-apart.jpg; English; https://en.wikipedia.org/wiki/Things_Fall_Apart
;·209; Things Fall Apart;·1958
Hans Christian Andersen; Denmark; images/fairy-tales.jpg; Danish; https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵
;·784; Fairy tales;·1836
Dante Alighieri; Italy; images/the-divine-comedy.jpg; Italian; https://en.wikipedia.org/wiki/Divine_Comedy
;·928; The Divine Comedy;·1315
Unknown; Sumer and Akkadian Empire; images/the-epic-of-gilgamesh.jpg; Akkadian; https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
;·160; The Epic Of Gilgamesh; -1700
Unknown; Achaemenid Empire; images/the-book-of-job.jpg; Hebrew; https://en.wikipedia.org/wiki/Book_of_Job
;·176; The Book Of Job; -600
Unknown; India/Iran/Iraq/Egypt/Tajikistan; images/one-thousand-and-one-nights.jpg; Arabic; https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
;·288; One Thousand and One Nights;·1200
Unknown; Iceland; images/njals-saga.jpg; Old Norse; https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
;·384; Njál's Saga;·1350
Jane Austen; United Kingdom; images/pride-and-prejudice.jpg; English; https://en.wikipedia.org/wiki/Pride_and_Prejudice
;·226; Pride and Prejudice;·1813
Honoré de Balzac; France; images/le-pere-goriot.jpg; French; https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
;·443; Le Père Goriot;·1835
Samuel Beckett; Republic of Ireland; images/molloy-malone-dies-the-unnamable.jpg; French, English; https://en.wikipedia.org/wiki/Molloy_(novel)↵
;·256; Molloy, Malone Dies, The Unnamable, the trilogy;·1952
Giovanni Boccaccio; Italy; images/the-decameron.jpg; Italian; https://en.wikipedia.org/wiki/The_Decameron
;·1024; The Decameron;·1351
Jorge Luis Borges; Argentina; images/ficciones.jpg; Spanish; https://en.wikipedia.org/wiki/Ficciones
;·224; Ficciones;·1965
... (truncated)
minemizer (compact)
chars: 13,753 tokens: 4,847 chars_og/tok: 5.8 enc_chars/tok: 2.8
author;country;imageLink;language;link;pages;title;year
Chinua Achebe;Nigeria;images/things-fall-apart.jpg;English;https://en.wikipedia.org/wiki/Things_Fall_Apart
;209;Things Fall Apart;1958
Hans Christian Andersen;Denmark;images/fairy-tales.jpg;Danish;https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵
;784;Fairy tales;1836
Dante Alighieri;Italy;images/the-divine-comedy.jpg;Italian;https://en.wikipedia.org/wiki/Divine_Comedy
;928;The Divine Comedy;1315
Unknown;Sumer and Akkadian Empire;images/the-epic-of-gilgamesh.jpg;Akkadian;https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
;160;The Epic Of Gilgamesh;-1700
Unknown;Achaemenid Empire;images/the-book-of-job.jpg;Hebrew;https://en.wikipedia.org/wiki/Book_of_Job
;176;The Book Of Job;-600
Unknown;India/Iran/Iraq/Egypt/Tajikistan;images/one-thousand-and-one-nights.jpg;Arabic;https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
;288;One Thousand and One Nights;1200
Unknown;Iceland;images/njals-saga.jpg;Old Norse;https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
;384;Njál's Saga;1350
Jane Austen;United Kingdom;images/pride-and-prejudice.jpg;English;https://en.wikipedia.org/wiki/Pride_and_Prejudice
;226;Pride and Prejudice;1813
Honoré de Balzac;France;images/le-pere-goriot.jpg;French;https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
;443;Le Père Goriot;1835
Samuel Beckett;Republic of Ireland;images/molloy-malone-dies-the-unnamable.jpg;French, English;https://en.wikipedia.org/wiki/Molloy_(novel)↵
;256;Molloy, Malone Dies, The Unnamable, the trilogy;1952
Giovanni Boccaccio;Italy;images/the-decameron.jpg;Italian;https://en.wikipedia.org/wiki/The_Decameron
;1024;The Decameron;1351
Jorge Luis Borges;Argentina;images/ficciones.jpg;Spanish;https://en.wikipedia.org/wiki/Ficciones
;224;Ficciones;1965
... (truncated)
countries.json — Original: 1133948 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)1,133,948474,0142.42.4
JSON (min)787,962365,0373.12.2
CSVN/A
TSVN/A
YAML641,939219,2695.22.9
TOON691,140215,4505.33.2
TSON423,383158,3497.22.7
minemizer323,130133,6728.52.4
minemizer (compact)299,485133,5978.52.2
JSON (pretty)
chars: 1,133,948 tokens: 474,014 chars_og/tok: 2.4 enc_chars/tok: 2.4
[↵
· {↵
··· "name": {↵
····· "common": "Aruba",↵
····· "official": "Aruba",↵
····· "native": {↵
······· "nld": {↵
········· "official": "Aruba",↵
········· "common": "Aruba"↵
······· },↵
······· "pap": {↵
········· "official": "Aruba",↵
········· "common": "Aruba"↵
······· }↵
····· }↵
··· },↵
··· "tld": [↵
····· ".aw"↵
··· ],↵
··· "cca2": "AW",↵
··· "ccn3": "533",↵
··· "cca3": "ABW",↵
··· "cioc": "ARU",↵
··· "independent": false,↵
··· "status": "officially-assigned",
... (truncated)
JSON (min)
chars: 787,962 tokens: 365,037 chars_og/tok: 3.1 enc_chars/tok: 2.2
[{"name":{"common":"Aruba","official":"Aruba","native":{"nld":{"official":"Aruba","common":"Aruba"},"pap":{"official":"Aruba","common":"Aruba"}}},"tld":[".aw"],"cca2":"AW","ccn3":"533","cca3":"ABW","cioc":"ARU","independent":false,"status":"officially-assigned","unMember":false,"unRegionalGroup":"","currencies":{"AWG":{"name":"Aruban florin","symbol":"\u0192"}},"idd":{"root":"+2","suffixes":["97"]},"capital":["Oranjestad"],"altSpellings":["AW"],"region":"Americas","subregion":"Caribbean","languages":{"nld":"Dutch","pap":"Papiamento"},"translations":{"ara":{"official":"\u0623\u0631\u0648\u0628\u0627","common":"\u0623\u0631\u0648\u0628\u0627"},"bre":{"official":"Aruba","common":"Aruba"},"ces":{"official":"Aruba","common":"Aruba"},"deu":{"official":"Aruba","common":"Aruba"},"est":{"official":"Aruba","common":"Aruba"},"fin":{"official":"Aruba","common":"Aruba"},"fra":{"official":"Aruba","common":"Aruba"},"hrv":{"official":"Aruba","common":"Aruba"},"hun":{"official":"Aruba","common":"Aruba"},"ita":{"official":"Aruba","common":"Aruba"},"jpn":{"official":"\u30a2\u30eb\u30d0","common":"\u30a2\u30eb\u30d0"},"kor":{"official":"\uc544\ub8e8\ubc14","common":"\uc544\ub8e8\ubc14"},"nld":{"official":"Aruba","common":"Aruba"},"per":{"official":"\u0622\u0631\u0648\u0628\u0627","common":"\u0622\u0631\u0648\u0628\u0627"},"pol":{"official":"Aruba","common":"Aruba"},"por":{"official":"Aruba","common":"Aruba"},"rus":{"official":"\u0410\u0440\u0443\u0431\u0430","common":"\u0410\u0440\u0443\u0431\u0430"},"slk":{"official":"Aruba","common":"Aruba"},"spa":{"official":"Aruba","common":"Aruba"},"srp":{"official":"Aruba","common":"Aruba"},"swe":{"official":"Aruba","common":"Aruba"},"tur":{"official":"Aruba","common":"Aruba"},"urd":{"official":"\u0627\u0631\u0648\u0628\u0627","common":"\u0627\u0631\u0648\u0628\u0627"},"zho":{"official":"\u963f\u9c81\u5df4","common":"\u963f\u9c81\u5df4"}},"latlng":[12.5,-69.96666666],"landlocked":false,"borders":[],"area":180,"flag":"\ud83c\udde6\ud83c\uddfc","de
monyms":{"eng":{"f":"Aruban","m":"Aruban"},"fra":{"f":"Arubaise","m":"Arubais"}}},{"name":{"common":"Afghanistan","official":"Islamic Republic of Afghanistan","native":{"prs":{"official":"\u062c\u0645\u0647\u0648\u0631\u06cc \u0627\u0633\u0644\u0627\u0645\u06cc \u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"pus":{"official":"\u062f \u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646 \u0627\u0633\u0644\u0627\u0645\u064a \u062c\u0645\u0647\u0648\u0631\u06cc\u062a","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"tuk":{"official":"Owganystan Yslam Respublikasy","common":"Owganystan"}}},"tld":[".af"],"cca2":"AF","ccn3":"004","cca3":"AFG","cioc":"AFG","independent":true,"status":"officially-assigned","unMember":true,"unRegionalGroup":"Asia and the Pacific Group","currencies":{"AFN":{"name":"Afghan afghani","symbol":"\u060b"}},"idd":{"root":"+9","suffixes":["3"]},"capital":["Kabul"],"altSpellings":["AF","Af\u0121\u0101nist\u0101n"],"region":"Asia","subregion":"Southern Asia","languages":{"prs":"Dari","pus":"Pashto","tuk":"Turkmen"},"translations":{"ara":{"official":"\u062c\u0645\u0647\u0648\u0631\u064a\u0629 \u0623\u0641\u0641\u0627\u0646\u0633\u062a\u0627\u0646 \u0627\u0644\u0625\u0633\u0644\u0627\u0645\u064a\u0629","common":"\u0623\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"bre":{"official":"Republik Islamek Afghanistan","common":"Afghanistan"},"ces":{"official":"Afgh\u00e1nsk\u00e1 isl\u00e1msk\u00e1 republika","common":"Afgh\u00e1nist\u00e1n"},"deu":{"official":"Islamische Republik Afghanistan","common":"Afghanistan"},"est":{"official":"Afganistani Islamivabariik","common":"Afganistan"},"fin":{"official":"Afganistanin islamilainen tasavalta","common":"Afganistan"},"fra":{"official":"R\u00e9publique islamique d'Afghanistan","common":"Afghanistan"},"hrv":{"official":"Islamska Republika Afganistan","common":"Afganistan"},"hun":{"official":"Afganiszt\u00e1ni 
Iszl\u00e1m K\u00f6zt\u00e1rsas\u00e1g","common":"Afganiszt\u00e1n"},"ita":{"official":"Repubblica islamica dell'Afghanistan","common":"Afghanistan"},"jpn":{"official":"\u30a2\u30d5\u30ac\u30cb\u30b9\u30bf\u30f3\u30fb\u30a4\u30b9\u30e9\u30e0\u5171\u548c\u56fd","common":"\u30a2\u30d5\u30ac\u30cb\u30b9\u30bf\u30f3"},"kor":{"official":"\uc544\ud504\uac00\ub2c8\uc2a4\ud0c4 \uc774\uc2ac\ub78c \uacf5\ud654\uad6d","common":"\uc544\ud504\uac00\ub2c8\uc2a4\ud0c4"},"nld":{"official":"Islamitische Republiek Afghanistan","common":"Afghanistan"},"per":{"official":"\u062c\u0645\u0647\u0648\u0631\u06cc \u0627\u0633\u0644\u0627\u0645\u06cc \u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"pol":{"official":"Islamska Republika Afganistanu","common":"Afganistan"},"por":{"official":"Rep\u00fablica Isl\u00e2mica do Afeganist\u00e3o","common":"Afeganist\u00e3o"},"rus":{"official":"\u0418\u0441\u043b\u0430\u043c\u0441\u043a\u0430\u044f \u0420\
... (truncated)
CSV: N/A
TSV: N/A
YAML
chars: 641,939 tokens: 219,269 chars_og/tok: 5.2 enc_chars/tok: 2.9
- altSpellings:↵
· - AW
· area:·180
· borders: []↵
· capital:↵
· - Oranjestad
· cca2: AW
· cca3: ABW
· ccn3: '533'↵
· cioc: ARU
· currencies:↵
··· AWG:↵
····· name: Aruban florin
····· symbol:·ƒ
· demonyms:↵
··· eng:↵
····· f: Aruban
····· m: Aruban
··· fra:↵
····· f: Arubaise
····· m: Arubais
· flag:🇼
· idd:↵
··· root: '+2'↵
··· suffixes:
... (truncated)
TOON
chars: 691,140 tokens: 215,450 chars_og/tok: 5.3 enc_chars/tok: 3.2
[250]:↵
· -↵
··· name:↵
····· common: Aruba
····· official: Aruba
····· native:↵
······· nld:↵
········· official: Aruba
········· common: Aruba
······· pap:↵
········· official: Aruba
········· common: Aruba
··· tld[1]: .aw
··· cca2: AW
··· ccn3: "533"↵
··· cca3: ABW
··· cioc: ARU
··· independent: false
··· status: officially-assigned
··· unMember: false
··· unRegionalGroup: ""↵
··· currencies:↵
····· AWG:↵
······· name: Aruban florin
······· symbol:·ƒ
... (truncated)
TSON
chars: 423,383 tokens: 158,349 chars_og/tok: 7.2 enc_chars/tok: 2.7
{@name(@common,official,native),tld,cca2,ccn3,cca3,cioc,independent,status,unMember,unRegionalGroup,currencies,idd(@root,suffixes),capital,altSpellings,region,subregion,languages,translations(@ara,bre,ces,deu,est,fin,fra,hrv,hun,ita,jpn,kor,nld,per,pol,por,rus,slk,spa,srp,swe,tur,urd,zho),latlng,landlocked,borders,area,flag,demonyms(@eng,fra)#250|{Aruba,Aruba,{@nld,pap|{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba}}},[.aw],AW,"533",ABW,ARU,false,officially-assigned,false,"",{@AWG|{@name,symbol|"Aruban florin",ƒ}},{"+2",["97"]},[Oranjestad],[AW],Americas,Caribbean,{@nld,pap|Dutch,Papiamento},{{@official,common|أروبا,أروبا},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|アルバ,アルバ},{@official,common|,},{@official,common|Aruba,Aruba},{@official,common|آروبا,آروبا},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Аруба,Аруба},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|اروبا,اروبا},{@official,common|,}},[12.5,-69.96666666],false,[],180,🇦🇼,{{@f,m|Aruban,Aruban},{@f,m|Arubaise,Arubais}}|{Afghanistan,"Islamic Republic of Afghanistan",{@prs,pus,tuk|{@official,common|"جمهوری اسلامی افغانستان",افغانستان},{@official,common|"د افغانستان اسلامي جمهوریت",افغانستان},{@official,common|"Owganystan Yslam Respublikasy",Owganystan}}},[.af],AF,"004",AFG,AFG,true,officially-assigned,true,"Asia and the Pacific Group",{@AFN|{@name,symbol|"Afghan afghani",}},{"+9",["3"]},[Kabul],[AF,Afġānistān],Asia,"Southern Asia",{@prs,pus,tuk|Dari,Pashto,Turkmen},{{@official,common|"جمهورية أففانستان الإسلامية",أفغانستان},{@official,common|"Republik Islamek 
Afghanistan",Afghanistan},{@official,common|"Afghánská islámská republika",Afghánistán},{@official,common|"Islamische Republik Afghanistan",Afghanistan},{@official,common|"Afganistani Islamivabariik",Afganistan},{@official,common|"Afganistanin islamilainen tasavalta",Afganistan},{@official,common|"publique islamique d'Afghanistan",Afghanistan},{@official,common|"Islamska Republika Afganistan",Afganistan},{@official,common|"Afganisztáni Iszlámztársaság",Afganisztán},{@official,common|"Repubblica islamica dell'Afghanistan",Afghanistan},{@official,common|フ�スタンイス共和国,フ�スタン},{@official,common|"",},{@official,common|"Islamitische Republiek Afghanistan",Afghanistan},{@official,common|"جمهوری اسلامی افغانستان",افغانستان},{@official,common|"Islamska Republika Afganistanu",Afganistan},{@official,common|"República Islâmica do Afeganistão",Afeganistão},{@official,common|"Исламская Республика Афганистан",Афганистан},{@official,common|"Afgánsky islamský štát",Afganistan},{@official,common|"República Islámica de Afganistán",Afganistán},{@official,common|"Islamska Republika Avganistan",Avganistan},{@official,common|"Islamiska republiken Afghanistan",Afghanistan},{@official,common|"Afganistan İslam Cumhuriyeti",Afganistan},{@official,common|"اسلامی جمہوریہ افغانستان",افغانستان},{@official,common|阿富汗伊斯兰共和国,阿富汗}},[33,65],true,[IRN,PAK,TKM,UZB,TJK,CHN],652230,🇦🇫,{{@f,m|Afghan,Afghan},{@f,m|Afghane,Afghan}}|{Angola,"Republic of Angola",{@por|{@official,common|"República de Angola",Angola}}},[.ao],AO,"024",AGO,ANG,true,officially-assigned,true,"African Group",{@AOA|{@name,symbol|"Angolan kwanza",Kz}},{"+2",["44"]},[Luanda],[AO,"República de Angola","ʁɛpublika de an'ɡɔla"],Africa,"Middle Africa",{@por|Portuguese},{{@official,common|أنغولا,"جمهورية أنغولا"},{@official,common|"Republik Angola",Angola},{@official,common|"Angolská republika",Angola},{@official,common|"Republik Angola",Angola},{@official,common|"Angola Vabariik",Angola},{@official,common|"Angolan 
tasavalta",Angola},{@official,common|"publique d'Angola",Angola},{@official,common|"Republika Angola",Angola},{@official,common|Angola,Angola},{@official,common|"Repubblica dell'Angola",Angola},{@official,common|アン共和国,アン},{@official,common|"",},{@official,common|"Republiek Angola",Angola},{@official,common|"جمهوری آنگولا",آنگولا},{@official,common|"Republika Angoli",Angola},{@official,common|"República de Angola",Angola},{@official,common|"Республика Ангола",Ангола},{@official,common|"Angolská republika",Angola},{@official,common|"República de Angola",Angola},{@official,common|"Republika Angola",Angola},{@official,common|"Republiken Angola",Angola},{@official,common|"Angola Cumhuriyeti",Angola},{@official,common|"جمہوریہ انگولہ",انگولہ},{@official,common|共和国,}},[-12.5,18.5],false,[COG,COD,ZMB,NAM],1246700,🇦🇴,{{@f,m|Angolan,Angolan},{@f,m|Angolaise,Angolais}}|{Anguilla,Anguilla,{@eng|{@official,common|Anguilla,Anguilla}}},[.ai],AI,"660",AIA,"",false,officially-assigned,false,"",{@XCD
... (truncated)
minemizer
chars: 323,130 tokens: 133,672 chars_og/tok: 8.5 enc_chars/tok: 2.4
name{ common; official; native{ ...}}; tld[]; cca2; ccn3; cca3; cioc; independent; status; unMember; unRegionalGroup; currencies{ ...}; idd{ root; suffixes[]}; capital[]; altSpellings[]; region; subregion; languages{ ...}; translations{ ara{ official; common}; bre{ official; common}; ces{ official; common}; deu{ official; common}; est{ official; common}; fin{ official; common}; fra{ official; common}; hrv{ official; common}; hun{ official; common}; ita{ official; common}; jpn{ official; common}; kor{ official; common}; nld{ official; common}; per{ official; common}; pol{ official; common}; por{ official; common}; rus{ official; common}; slk{ official; common}; spa{ official; common}; srp{ official; common}; swe{ official; common}; tur{ official; common}; urd{ official; common}; zho{ official; common}}; latlng[]; landlocked; borders[]; area; flag; demonyms{ eng{ f; m}; fra{ f; m}}↵
{ Aruba; Aruba;{ nld:{ official: Aruba; common: Aruba}; pap:{ official: Aruba; common: Aruba}}};[ .aw]; AW;·533; ABW; ARU;false; officially-assigned;false;;{ AWG:{ name: Aruban florin; symbol:·ƒ}};{ +2;[·97]};[ Oranjestad];[ AW]; Americas; Caribbean;{ nld: Dutch; pap: Papiamento};{{ أروبا; أروبا};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{;};{;};{ Aruba; Aruba};{ آروبا; آروبا};{ Aruba; Aruba};{ Aruba; Aruba};{ Аруба; Аруба};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ اروبا; اروبا};{;}};[·12.5; -69.96666666];false;[];·180;🇼;{{ Aruban; Aruban};{ Arubaise; Arubais}}↵
{ Afghanistan; Islamic Republic of Afghanistan;{ prs:{ official: جمهوری اسلامی افغانستان; common: افغانستان}; pus:{ official: د افغانستان اسلامي جمهوریت; common: افغانستان}; tuk:{ official: Owganystan Yslam Respublikasy; common: Owganystan}}};[ .af]; AF;·004; AFG; AFG;true; officially-assigned;true; Asia and the Pacific Group;{ AFN:{ name: Afghan afghani; symbol:}};{ +9;[·3]};[ Kabul];[ AF; Afġānistān]; Asia; Southern Asia;{ prs: Dari; pus: Pashto; tuk: Turkmen};{{ جمهورية أففانستان الإسلامية; أفغانستان};{ Republik Islamek Afghanistan; Afghanistan};{ Afghánská islámská republika; Afghánistán};{ Islamische Republik Afghanistan; Afghanistan};{ Afganistani Islamivabariik; Afganistan};{ Afganistanin islamilainen tasavalta; Afganistan};{publique islamique d'Afghanistan; Afghanistan};{ Islamska Republika Afganistan; Afganistan};{ Afganisztáni Iszlámztársaság; Afganisztán};{ Repubblica islamica dell'Afghanistan; Afghanistan};{フ�スタンイス共和国;フ�スタン};{;};{ Islamitische Republiek Afghanistan; Afghanistan};{ جمهوری اسلامی افغانستان; افغانستان};{ Islamska Republika Afganistanu; Afganistan};{ República Islâmica do Afeganistão; Afeganistão};{ Исламская Республика Афганистан; Афганистан};{ Afgánsky islamský štát; Afganistan};{ República Islámica de Afganistán; Afganistán};{ Islamska Republika Avganistan; Avganistan};{ Islamiska republiken Afghanistan; Afghanistan};{ Afganistan İslam Cumhuriyeti; Afganistan};{ اسلامی جمہوریہ افغانستان; افغانستان};{伊斯兰共和国;}};[·33;·65];true;[ IRN; PAK; TKM; UZB; TJK; CHN];·652230;🇫;{{ Afghan; Afghan};{ Afghane; Afghan}}↵
{ Angola; Republic of Angola;{ por:{ official: República de Angola; common: Angola}}};[ .ao]; AO;·024; AGO; ANG;true; officially-assigned;true; African Group;{ AOA:{ name: Angolan kwanza; symbol: Kz}};{ +2;[·44]};[ Luanda];[ AO; República de Angola;·ʁɛpublika de an'ɡɔla]; Africa; Middle Africa;{ por: Portuguese};{{ أنغولا; جمهورية أنغولا};{ Republik Angola; Angola};{ Angolská republika; Angola};{ Republik Angola; Angola};{ Angola Vabariik; Angola};{ Angolan tasavalta; Angola};{publique d'Angola; Angola};{ Republika Angola; Angola};{ Angola; Angola};{ Repubblica dell'Angola; Angola};{共和国;};{;};{ Republiek Angola; Angola};{ جمهوری آنگولا; آنگولا};{ Republika Angoli; Angola};{ República de Angola; Angola};{ Республика Ангола; Ангола};{ Angolská republika; Angola};{ República de Angola; Angola};{ Republika Angola; Angola};{ Republiken Angola; Angola};{ Angola Cumhuriyeti; Angola};{ جمہوریہ انگولہ; انگولہ};{共和国;}};[ -12.5;·18.5];false;[ COG; COD; ZMB; NAM];·1246700;🇴;{{ Angolan; Angolan};{ Angolaise; Angolais}}↵
{ Anguilla; Anguilla;{ eng:{ official: Anguilla; common: Anguilla}}};[ .ai]; AI;·660; AIA;;false; officially-assigned;false;;{ XCD:{ name: Eastern Caribbean dollar; symbol: $}};{ +1;[·264]};[ The Valley];[ AI]; Americas; Caribbean;{ eng: English};{{ أنغويلا; أنغويلا};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Angvila};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{;};{;};{ Anguilla; Anguilla};{ آنگویلا; آنگویلا};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Ангилья; Ангилья};{ Anguilla; Anguilla};{ Anguila; Anguilla};{ Angvila; Angvila};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ اینگویلا; اینگویلا};{;}};[·18.25; -63.16666666];false;[];·91;🇮;{{ Anguillian; Anguillian};{ Anguillane; Anguillan}}↵
{ Åland Islands; Åland Islands;{ swe:{ official: Landskapet Åland; common: Åland}}};[ .ax]; AX;·248; ALA;;false; officially-assigned;false;;{ EUR:{ name: Euro; symbol:}};{ +3;[·5818]};[ Mariehamn];[ AX; Aaland; Aland; Ahvenanmaa]; Europe; Northern Europe;{ swe: Swedish};{{ جزر أولاند; جزر أولاند};{ Inizi Åland; Åland};{ Ålandské ostrovy; Ålandy};{ Åland-Inseln; Åland};{ Ahvenamaa maakond; Ahvenamaa};{ Ahvenanmaan maakunta; Ahvenanmaa};{ Ahvenanmaa; Ahvenanmaa};{ Aland Islands; Ålandski otoci};{ Åland-szigetek; Åland-szigetek};{ Isole Åland; Isole Aland};{ー�ンド;ー�ンド};{;};{ Åland eilanden; Ålandeilanden};{ جزایر الند; جزایر الند};{ Wyspy Alandzkie; Wyspy Alandzkie};{ Ilhas Åland; Alândia};{ Аландские острова; Аландские острова};{ Alandské ostrovy; Alandy};{ Islas Åland; Alandia};{ Olandska Ostrva; Olandska Ostrva};{ Åland; Åland};{ Åland Adaları; Åland};{ جزائر اولند; جزائر اولند};{群岛;群岛}};[·60.116667;·19.9];false;[];·1580;🇽;{{ Ålandish; Ålandish};{ Ålandaise; Ålandais}}↵
{ Albania; Republic of Albania;{ sqi:{ official: Republika e Shqipërisë; common: Shqipëria}}};[ .al]; AL;·008; ALB; ALB;true; officially-assigned;true; Eastern European Group;{ ALL:{ name: Albanian lek; symbol: L}};{ +3;[·55]};[ Tirana];[ AL; Shqipëri; Shqipëria; Shqipnia]; Europe; Southeast Europe;{ sqi: Albanian};{{ جمهورية ألبانيا; ألبانيا};{ Republik Albania; Albania};{ Albánská republika; Albánie};{ Republik Albanien; Albanien};{ Albaania Vabariik; Albaania};{ Albanian tasavalta; Albania};{publique d'Albanie; Albanie};{ Republika Albanija; Albanija};{ Albánztársaság; Albánia};{ Repubblica d'Albania; Albania};{ニア共和国;ニア};{;};{ Republiek Albanië; Albanië};{ جمهوری آلبانی; آلبانی};{ Republika Albanii; Albania};{ República da Albânia; Albânia};{ Республика Албания; Албания};{ Albánska republika; Albánsko};{ República de Albania; Albania};{ Republika Albanija; Albanija};{ Republiken Albanien; Albanien};{ Arnavutluk Cumhuriyeti; Arnavutluk};{ جمہوریہ البانیا; البانیا};{尼亚共和国;尼亚}};[·41;·20];false;[ MNE; GRC; MKD; UNK];·28748;🇱;{{ Albanian; Albanian};{ Albanaise; Albanais}}↵
{ Andorra; Principality of Andorra;{ cat:{ official: Principat d'Andorra; common: Andorra}}};[ .ad]; AD;·020; AND; AND;true; officially-assigned;true; Western European and Others Group;{ EUR:{ name: Euro; symbol:}};{ +3;[·76]};[ Andorra la Vella];[ AD; Principality of Andorra; Principat d'Andorra]; Europe; Southern Europe;{ cat: Catalan};{{ إمارة أندورا; أندورا};{ Priñselezh Andorra; Andorra};{ Andorrské knížect; Andorra};{ Fürstentum Andorra; Andorra};{ Andorra Vürstiriik; Andorra};{ Andorran ruhtinaskunta; Andorra};{ Principauté d'Andorre; Andorre};{ Kneževina Andora; Andora};{ Andorra; Andorra};{ Principato di Andorra; Andorra};{ンド;ンド};{;};{ Prinsdom Andorra; Andorra};{ شاهزادهنشین آندورا; آندورا};{ Księstwo Andory; Andora};{ Principado de Andorra; Andorra};{ Княжество Андорра; Андорра};{ Andorrské kniežatstvo; Andorra};{ Principado de Andorra; Andorra};{ Kneževina Andora; Andora};{ Furstendömet Andorra; Andorra};{ Andorra Prensliği; Andorra};{ اماراتِ انڈورا; انڈورا};{;}};[·42.5;·1.5];true;[ FRA; ESP];·468;🇩;{{ Andorran; Andorran};{ Andorrane; Andorran}}↵
{ United Arab Emirates; United Arab Emirates;{ ara:{ official: الإمارات العربية المتحدة; common: الإمارات}}};[ .ae; امارات.]; AE;·784; ARE; UAE;true; officially-assigned;true; Asia and the Pacific Group;{ AED:{ name: United Arab Emirates dirham; symbol: د.إ}};{ +9;[·71]};[ Abu Dhabi];[ AE; UAE; Emirates]; Asia; Western Asia;{ ara: Arabic};{{ الإمارات العربية المتحدة; الإمارات};{ Emirelezhioù Arab Unanet; Emirelezhioù Arab Unanet};{ Spojené arabské emiráty; Spojené arabské emiráty};{ Vereinigte Arabische Emirate; Vereinigte Arabische Emirate};{ Araabia Ühendemiraadid; Araabia Ühendemiraadid};{ Yhdistyneet arabiemiirikunnat; Arabiemiraatit};{ Émirats arabes unis; Émirats arabes unis};{ Ujedinjeni Arapski Emirati; Ujedinjeni Arapski Emirati};{ Egyesült Arab Emírségek; Egyesült Arab Emírségek};{ Emirati Arabi Uniti; Emirati Arabi Uniti};{; UAE};{����;};{ Verenigde Arabische Emiraten; Verenigde Arabische Emiraten};{ امارات متحده عربی; امارات};{ Zjednoczone Emiraty Arabskie; Zjednoczone Emiraty Arabskie};{ Emirados Árabes Unidos; Emirados Árabes Unidos};{ Объединенные Арабские Эмираты; Объединённые Арабские Эмираты};{ Spojené arabské emiráty; Spojené arabské emiráty};{ Emiratos Árabes Unidos; Emiratos Árabes Unidos};{ Ujedinjeni Arapski Emirati; Ujedinjeni Arapski Emirati};{ Förenade Arabemiraten; Förenade Arabemiraten};{ Birleşik Arap Emirlikleri; Birleşik Arap Emirlikleri};{ متحدہ عرب امارات; متحدہ عرب امارات};{联合;联合}};[·24;·54];false;[ OMN; SAU];·83600;🇪;{{ Emirati; Emirati};{ Emirienne; Emirien}}↵
{ Argentina; Argentine Republic;{ grn:{ official: Argentine Republic; common: Argentina}; spa:{ official: República Argentina; common: Argentina}}};[ .ar]; AR;·032; ARG; ARG;true; officially-assigned;true; Latin American and Caribbean Group;{ ARS:{ name: Argentine peso; symbol: $}};{ +5;[·4]};[ Buenos Aires];[ AR; Argentine Republic; República Argentina]; Americas; South America;{ grn: Guaraní; spa: Spanish};{{ جمهورية الأرجنتين; الأرجنتين};{ Republik Arc'hantina; Arc'hantina};{ Argentinská republika; Argentina};{ Argentinische Republik; Argentinien};{ Argentina Vabariik; Argentina};{ Argentiinan tasavalta; Argentiina};{publique argentine; Argentine};{ Argentinski Republika; Argentina};{ Argentinztársaság; Argentína};{ Repubblica Argentina; Argentina};{チン共和国;チン};{;};{ Argentijnse Republiek; Argentinië};{ جمهوری آرژانتین; آرژانتین};{ Republika Argentyńska; Argentyna};{ República Argentina; Argentina};{ Аргентинская Республика; Аргентина};{ Argentínska republika; Argentína};{ República Argentina; Argentina};{ Republika Argentina; Argentina};{ Republiken Argentina; Argentina};{ Arjantin Cumhuriyeti; Arjantin};{ جمہوریہ ارجنٹائن; ارجنٹائن};{共和国;}};[ -34; -64];false;[ BOL; BRA; CHL; PRY; URY];·2780400;🇷;{{ Argentine; Argentine};{ Argentine; Argentin}}↵
{ Armenia; Republic of Armenia;{ hye:{ official:·Հայաստանի·Հանրապետություն; common:·Հայաստան}}};[ .am]; AM;·051; ARM; ARM;true; officially-assigned;true; Eastern European Group;{ AMD:{ name: Armenian dram; symbol:·}};{ +3;[·74]};[ Yerevan];[ AM; Hayastan; Republic of Armenia;·Հայաստանի·Հանրապետություն]; Asia; Western Asia;{ hye: Armenian};{{ جمهورية أرمينيا; أرمينيا};{ Republik Armenia; Armenia};{ Arménská republika; Arménie};{ Republik Armenien; Armenien};{ Armeenia Vabariik; Armeenia};{ Armenian tasavalta; Armenia};{publique d'Arménie; Arménie};{ Republika Armenija; Armenija};{ Örményország; Örményország};{ Repubblica di Armenia; Armenia};{ニア共和国;ニア};{;};{ Republiek Armen; Armen};{ جمهوری ارمنستان; ارمنستان};{ Republika Armenii; Armenia};{ República da Arménia; Arménia};{ Республика Армения; Армения};{ Arménska republika; Arménsko};{ República de Armenia; Armenia};{ Republika Jermenija; Jermenija};{ Republiken Armenien; Armenien};{ Ermenistan Cumhuriyeti; Ermenistan};{ جمہوریہ آرمینیا; آرمینیا};{·尼亚共和国;·尼亚}};[·40;·45];true;[ AZE; GEO; IRN; TUR];·29743;🇲;{{ Armenian; Armenian};{ Arménienne; Arménien}}↵
{ American Samoa; American Samoa;{ eng:{ official: American Samoa; common: American Samoa}; smo:{ official: Sāmoa Amelika; common: Sāmoa Amelika}}};[ .as]; AS;·016; ASM; ASA;false; officially-assigned;false;;{ USD:{ name: United States dollar; symbol: $}};{ +1;[·684]};[ Pago Pago];[ AS; Amerika Sāmoa; Amelika Sāmoa; Sāmoa Amelika]; Oceania; Polynesia;{ eng: English; smo: Samoan};{{ ساموا الأمريكية; ساموا الأمريكية};{ Samoa Amerikan; Samoa Amerikan};{ Americká Samoa; Americká Samoa};{ Amerikanisch-Samoa; Amerikanisch-Samoa};{ Ameerika Samoa; Ameerika Samoa};{ Amerikan Samoa; Amerikan Samoa};{ Samoa américaines; Samoa américaines};{ amerka Samoa; Amerka Samoa};{ Szamoa; Szamoa};{ Samoa americane; Samoa Americane};{;メリ};{;};{ Amerikaans Samoa; Amerikaans Samoa};{ ساموآی آمریکا; ساموآی آمریکا};{ Samoa Amerykańskie; Samoa Amerykańskie};{ Samoa americana; Samoa Americana};{ американское Самоа; Американское Самоа};{ Americká Samoa; Americká Samoa};{ Samoa Americana; Samoa Americana};{ Amerka Samoa; Amerka Samoa};{ Amerikanska Samoa; Amerikanska Samoa};{ Amerikan Samoası; Amerikan Samoası};{ امریکی سمووا; امریکی سمووا};{;}};[ -14.33333333; -170];false;[];·199;🇸;{{ American Samoan; American Samoan};{ Samoane; Samoan}}↵
{ Antarctica; Antarctica;{}};[ .aq]; AQ;·010; ATA;;false; officially-assigned;false;;{};{;[]};[];[ AQ]; Antarctic;;{};{{ أنتارتيكا; أنتارتيكا};{ Antarktika; Antarktika};{ Antarktida; Antarktida};{ Antarktika; Antarktis};{ Antarktika; Antarktika};{ Etelämanner; Etelämanner};{ Antarctique; Antarctique};{ Antarktika; Antarktika};{ Antarktisz; Antarktisz};{ Antartide; Antartide};{;大陸};{;};{ Antarctica; Antarctica};{ جنوبگان; جنوبگان};{ Antarktyka; Antarktyka};{ Antártica; Antártida};{ Антарктида; Антарктида};{ Antarktída; Antarktída};{ Antártida; Antártida};{ Antarktik; Antarktik};{ Antarktis; Antarktis};{ Antarktika; Antarktika};{ انٹارکٹکا; انٹارکٹکا};{;}};[ -90;·0];false;[];·14000000;🇶;{{ Antarctican; Antarctican};{ Antarcticaine; Antarcticain}}↵
{ French Southern and Antarctic Lands; Territory of the French Southern and Antarctic Lands;{ fra:{ official: Territoire des Terres australes et antarctiques françaises; common: Terres australes et antarctiques françaises}}};[ .tf]; TF;·260; ATF;;false; officially-assigned;false;;{ EUR:{ name: Euro; symbol:}};{ +2;[·62]};[ Port-aux-Français];[ TF; French Southern Territories]; Antarctic;;{ fra: French};{{ مقاطعات وأقاليم ما وراء البحار الفرنسية; أراض فرنسية جنوبية وأنتارتيكية};{ Tiriad Douaroù Aostral hag Antarktikel Frañs; Douaroù Aostral hag Antarktikel Frañs};{ Teritorium Francouzská již a antarktická území; Francouzská již a antarktická území};{ Gebiet der Französisch Süd- und Antarktisgebiete; Französische Süd- und Antarktisgebiete};{ Prantsuse Lõunaalad; Prantsuse Lõunaalad};{ Ranskan eteläiset ja antarktiset alueet; Ranskan eteläiset ja antarktiset alueet};{ Territoire des Terres australes et antarctiques françaises; Terres australes et antarctiques françaises};{ Teritoriju Francuski južni i antarktički teritoriji; Francuski južni i antarktički teritoriji};{ Franciali és antarktiszi területek; Franciali és antarktiszi területek};{ Territorio della australi e antartiche francesi Terre; Territori Francesi del Sud};{ランス;ランス南方地域};{ 지역; 지역};{ Grondgebied van de Franse Zuidelijke en Antarctische gebieden; Franse Gebieden in de zuidelijke Indische Oceaan};{ سرزمینهای جنوبی و جنوبگانی فرانسه; سرزمینهای جنوبی و جنوبگانی فرانسه};{ Francuskie Terytoria Południowe i Antarktyczne; Francuskie Terytoria Południowe i Antarktyczne};{ Território do Sul e Antártica Francesa; Terras Austrais e Antárticas Francesas};{ Территория Французские Южные и Антарктические земли; Французские Южные и Антарктические территории};{ Francúzske juž a antarktické územia; Francúzske juŽ a antarktické územia};{ Territorio del Francés Tierras australes y antárticas; Tierras Australes y Antárticas Francesas};{ Francuske južne i antarktičke zemlje; Francuske južne i antarktičke zemlje};{ Franska syd- 
och Antarktisterritorierna; Franskadra territorierna};{ Fransızney ve Antarktika Toprakları; Fransızney ve Antarktika Toprakları};{ سرزمینِ جنوبی فرانسیسیہ و انٹارکٹیکہ; سرزمین جنوبی فرانسیسیہ و انٹارکٹیکا};{南部南极土地;南部南极土地}};[ -49.25;·69.167];false;[];·7747;🇫;{{ French; French};{ Française; Français}}↵
{ Antigua and Barbuda; Antigua and Barbuda;{ eng:{ official: Antigua and Barbuda; common: Antigua and Barbuda}}};[ .ag]; AG;·028; ATG; ANT;true; officially-assigned;true; Latin American and Caribbean Group;{ XCD:{ name: Eastern Caribbean dollar; symbol: $}};{ +1;[·268]};[ Saint John's];[ AG]; Americas; Caribbean;{ eng: English};{{ أنتيغوا وباربودا; أنتيغوا وباربودا};{ Antigua ha Barbuda; Antigua ha Barbuda};{ Antigua a Barbuda; Antigua a Barbuda};{ Antigua und Barbuda; Antigua und Barbuda};{ Antigua ja Barbuda; Antigua ja Barbuda};{ Antigua ja Barbuda; Antigua ja Barbuda};{ Antigua -et-Barbuda; Antigua-et-Barbuda};{ Antigva i Barbuda; Antigva i Barbuda};{ Antigua és Barbuda; Antigua és Barbuda};{ Antigua e Barbuda; Antigua e Barbuda};{ティー�ー�;ティー�ー�};{��;��};{ Antigua en Barbuda; Antigua en Barbuda};{ آنتیگوا و باربودا; آنتیگوا و باربودا};{ Antigua i Barbuda; Antigua i Barbuda};{ Antigua e Barbuda; Antígua e Barbuda};{ Антигуа и Барбуда; Антигуа и Барбуда};{ Antigua a Barbuda; Antigua a Barbuda};{ Antigua y Barbuda; Antigua y Barbuda};{ Antigva i Barbuda; Antigva i Barbuda};{ Antigua och Barbuda; Antigua och Barbuda};{ Antigua ve Barbuda; Antigua ve Barbuda};{ اینٹیگوا و باربوڈا; اینٹیگوا و باربوڈا};{;}};[·17.05; -61.8];false;[];·442;🇬;{{ Antiguan, Barbudan; Antiguan, Barbudan};{ Antiguaise et barbudienne; Antiguaise et barbudien}}↵
{ Australia; Commonwealth of Australia;{ eng:{ official: Commonwealth of Australia; common: Australia}}};[ .au]; AU;·036; AUS; AUS;true; officially-assigned;true; Western European and Others Group;{ AUD:{ name: Australian dollar; symbol: $}};{ +6;[·1]};[ Canberra];[ AU]; Oceania; Australia and New Zealand;{ eng: English};{{ كومونولث أستراليا; أستراليا};{ Kenglad Aostralia; Aostralia};{ Australské společenst; Austrálie};{ Commonwealth Australien; Australien};{ Austraalia Ühendus; Austraalia};{ Australian liittovaltio; Australia};{ Australie; Australie};{ Commonwealth of Australia; Australija};{ Ausztrál Államszövetség; Ausztrália};{ Commonwealth dell'Australia; Australia};{ーストラリア;ーストラリア};{스트;};{ Gemenebest van Austral; Austral};{ قلمرو همسود استرالیا; استرالیا};{ Związek Australijski; Australia};{ Comunidade da Austrália; Austrália};{ Содружество Австралии; Австралия};{ Austrálsky zz; Austrália};{ Mancomunidad de Australia; Australia};{ Komonvelt Australija; Australija};{ Australiska statsförbundet; Australien};{ Avustralya Federal Devleti; Avustralya};{ دولتِ مشترکہ آسٹریلیا; آسٹریلیا};{利亚联邦;利亚}};[ -27;·133];false;[];·7692024;🇺;{{ Australian; Australian};{ Australienne; Australien}}↵
{ Austria; Republic of Austria;{ bar:{ official: Republik Österreich; common: Österreich}}};[ .at]; AT;·040; AUT; AUT;true; officially-assigned;true; Western European and Others Group;{ EUR:{ name: Euro; symbol:}};{ +4;[·3]};[ Vienna];[ AT; Osterreich; Oesterreich]; Europe; Central Europe;{ bar: Austro-Bavarian German};{{ جمهورية النمسا; النمسا};{ Republik Aostria; Aostria};{ Rakouská republika; Rakousko};{ Republik Österreich; Österreich};{ Austria Vabariik; Austria};{ Itävallan tasavalta; Itävalta};{publique d'Autriche; Autriche};{ Republika Austrija; Austrija};{ Ausztria; Ausztria};{ Repubblica d'Austria; Austria};{ースリア共和国;ースリア};{스트;스트};{ Republiek Oostenrijk; Oostenrijk};{ جمهوری اتریش; اتریش};{ Republika Austrii; Austria};{ República da Áustria; Áustria};{ Австрийская Республика; Австрия};{ Rakúska republika; Rakúsko};{ República de Austria; Austria};{ Republika Austrija; Austrija};{ Republiken Österrike; Österrike};{ Avusturya Cumhuriyeti; Avusturya};{ جمہوریہ آسٹریا; آسٹریا};{共和国;}};[·47.33333333;·13.33333333];true;[ CZE; DEU; HUN; ITA; LIE; SVK; SVN; CHE];·83871;🇹;{{ Austrian; Austrian};{ Autrichienne; Autrichien}}↵
{ Azerbaijan; Republic of Azerbaijan;{ aze:{ official: Azərbaycan Respublikası; common: Azərbaycan}; rus:{ official: Азербайджанская Республика; common: Азербайджан}}};[ .az]; AZ;·031; AZE; AZE;true; officially-assigned;true; Eastern European Group;{ AZN:{ name: Azerbaijani manat; symbol:}};{ +9;[·94]};[ Baku];[ AZ; Republic of Azerbaijan; Azərbaycan Respublikası]; Asia; Western Asia;{ aze: Azerbaijani; rus: Russian};{{ جمهورية أذربيجان; أذربيجان};{ Republik Azerbaidjan; Azerbaidjan};{ Ázerbájdžánská republika; Ázerbájdžán};{ Republik Aserbaidschan; Aserbaidschan};{ Aserbaidžaani Vabariik; Aserbaidžaan};{ Azerbaidzanin tasavalta; Azerbaidzan};{publique d'Azerbaïdjan; Azerbaïdjan};{ Republika Azerbajdžan; Azerbajdžan};{ Azerbajdzsán; Azerbajdzsán};{ Repubblica dell'Azerbaigian; Azerbaijan};{バイジャン共和国;バイジャン};{;};{ Republiek Azerbeidzjan; Azerbeidzjan};{ جمهوری آذربایجان; جمهوری آذربایجان};{ Republika Azerbejdżanu; Azerbejdżan};{ República do Azerbaijão; Azerbeijão};{ Азербайджанская Республика; Азербайджан};{ Azerbajanská republika; Azerbajan};{ República de Azerbaiyán; Azerbaiyán};{ Republika Azerbejdžan; Azerbejdžan};{ Republiken Azerbajdzjan; Azerbajdzjan};{ Azerbaycan Cumhuriyeti; Azerbaycan};{ جمہوریہ آذربائیجان; آذربائیجان};{共和国;}};[·40.5;·47.5];true;[ ARM; GEO; IRN; RUS; TUR];·86600;🇿;{{ Azerbaijani; Azerbaijani};{ Azerbaïdjanaise; Azerbaïdjanais}}↵
{ Burundi; Republic of Burundi;{ fra:{ official:publique du Burundi; common: Burundi}; run:{ official: Republika y'Uburundi ; common: Uburundi}}};[ .bi]; BI;·108; BDI; BDI;true; officially-assigned;true; African Group;{ BIF:{ name: Burundian franc; symbol: Fr}};{ +2;[·57]};[ Gitega];[ BI; Republic of Burundi; Republika y'Uburundi;publique du Burundi]; Africa; Eastern Africa;{ fra: French; run: Kirundi};{{ جمهورية بوروندي; بوروندي};{ Republik Burundi; Burundi};{ Burundská republika; Burundi};{ Republik Burundi; Burundi};{ Burundi Vabariik; Burundi};{ Burundin tasavalta; Burundi};{publique du Burundi; Burundi};{ Burundi; Burundi};{ Burundi; Burundi};{ Repubblica del Burundi; Burundi};{共和国;};{;};{ Republiek Burundi; Burundi};{ جمهوری بوروندی; بوروندی};{ Republika Burundi; Burundi};{ República do Burundi; Burundi};{ Республика Бурунди; Бурунди};{ Burundská republika; Burundi};{ República de Burundi; Burundi};{ Republika Burundi; Burundi};{ Republiken Burundi; Burundi};{ Burundi Cumhuriyeti; Burundi};{ جمہوریہ برونڈی; برونڈی};{共和国;}};[ -3.5;·30];true;[ COD; RWA; TZA];·27834;🇮;{{ Burundian; Burundian};{ Burundaise; Burundais}}↵
{ Belgium; Kingdom of Belgium;{ deu:{ official: Königreich Belgien; common: Belgien}; fra:{ official: Royaume de Belgique; common: Belgique}; nld:{ official: Koninkrijk België; common: België}}};[ .be]; BE;·056; BEL; BEL;true; officially-assigned;true; Western European and Others Group;{ EUR:{ name: Euro; symbol:}};{ +3;[·2]};[ Brussels];[ BE; België; Belgie; Belgien; Belgique; Kingdom of Belgium; Koninkrijk België; Royaume de Belgique; Königreich Belgien]; Europe; Western Europe;{ deu: German; fra: French; nld: Dutch};{{ مملكة بلجيكا; بلجيكا};{ Rouantelezh Belgia; Belgia};{ Belgické královst; Belgie};{ Königreich Belgien; Belgien};{ Belgia Kuningriik; Belgia};{ Belgian kuningaskunta; Belgia};{ Royaume de Belgique; Belgique};{ Kraljevina Belgija; Belgija};{ Belga Királyság; Belgium};{ Regno del Belgio; Belgio};{王国;};{기에;기에};{ Koninkrijk België; België};{ پادشاهی بلژیک; بلژیک};{ Królestwo Belgii; Belgia};{ Reino da Bélgica; Bélgica};{ Королевство Бельгия; Бельгия};{ Belgické kráľovstvo; Belgicko};{ Reino de Bélgica; Bélgica};{ Kraljevina Belgija; Belgija};{ Konungariket Belgien; Belgien};{ Belçika Krallığı; Belçika};{ مملکتِ بلجئیم; بلجئیم};{王国;}};[·50.83333333;·4];false;[ FRA; DEU; LUX; NLD];·30528;🇪;{{ Belgian; Belgian};{ Belge; Belge}}↵
{ Benin; Republic of Benin;{ fra:{ official:publique du Bénin; common: Bénin}}};[ .bj]; BJ;·204; BEN; BEN;true; officially-assigned;true; African Group;{ XOF:{ name: West African CFA franc; symbol: Fr}};{ +2;[·29]};[ Porto-Novo];[ BJ; Republic of Benin;publique du Bénin]; Africa; Western Africa;{ fra: French};{{ جمهورية بنين; بنين};{ Republik Benin; Benin};{ Beninská republika; Benin};{ Republik Benin; Benin};{ Benini Vabariik; Benin};{ Beninin tasavalta; Benin};{publique du Bénin; Bénin};{ Republika Benin; Benin};{ Beniniztársaság; Benin};{ Repubblica del Benin; Benin};{ナン共和国;ナン};{;};{ Republiek Benin; Benin};{ جمهوری بنین; بنین};{ Benin; Benin};{ República do Benin; Benin};{ Республика Бенин; Бенин};{ Beninská republika; Benin};{ República de Benin; Benín};{ Republika Benin; Benin};{ Republiken Benin; Benin};{ Benin Cumhuriyeti; Benin};{ جمہوریہ بینن; بینن};{共和国;}};[·9.5;·2.25];false;[ BFA; NER; NGA; TGO];·112622;🇯;{{ Beninese; Beninese};{ Béninoise; Béninois}}↵
{ Burkina Faso; Burkina Faso;{ fra:{ official:publique du Burkina; common: Burkina Faso}}};[ .bf]; BF;·854; BFA; BUR;true; officially-assigned;true; African Group;{ XOF:{ name: West African CFA franc; symbol: Fr}};{ +2;[·26]};[ Ouagadougou];[ BF]; Africa; Western Africa;{ fra: French};{{ بوركينا فاسو; بوركينا فاسو};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{publique du Burkina; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina};{ Burkina Faso; Burkina Faso};{ファ;ファ};{;};{ Burkina Faso; Burkina Faso};{ بورکینافاسو; بورکینافاسو};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Буркина -Фасо; Буркина-Фасо};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ برکینا فاسو; برکینا فاسو};{;}};[·13; -2];true;[ BEN; CIV; GHA; MLI; NER; TGO];·272967;🇫;{{ Burkinabe; Burkinabe};{ Burkinabée; Burkinabé}}↵
{ Bangladesh; People's Republic of Bangladesh;{ ben:{ official:া�া�্�া�্�্�; common:া�া�}}};[ .bd]; BD;·050; BGD; BAN;true; officially-assigned;true; Asia and the Pacific Group;{ BDT:{ name: Bangladeshi taka; symbol:·}};{ +8;[·80]};[ Dhaka];[ BD; People's Republic of Bangladesh; Gônôprôjatôntri Bangladesh]; Asia; Southern Asia;{ ben: Bengali};{{ جمهورية بنغلاديش الشعبية; بنغلاديش};{ Republik pobl Bangladesh; Bangladesh};{ Bangladéšská lidová republika; Bangladéš};{ Volksrepublik Bangladesch; Bangladesch};{ Bangladeshi Rahvavabariik; Bangladesh};{ Bangladeshin kansantasavalta; Bangladesh};{ Lapublique populaire du Bangladesh; Bangladesh};{ Narodna Republika Bangladeš; Bangladeš};{ Banglades; Banglades};{ Repubblica popolare del Bangladesh; Bangladesh};{ングシュ人民共和国;ングシュ};{;};{ Volksrepubliek Bangladesh; Bangladesh};{ جمهوری خلق بنگلادش; بنگلادش};{ Ludowa Republika Bangladeszu; Bangladesz};{ República Popular do Bangladesh; Bangladesh};{ Народная Республика Бангладеш; Бангладеш};{ Bangladéšskaudová republika; Bangladéš};{ República Popular de Bangladesh; Bangladesh};{ Narodna Republika Bangladeš; Bangladeš};{ Folkrepubliken Bangladesh; Bangladesh};{ Bangladeş Halk Cumhuriyeti; Bangladeş};{ عوامی جمہوریہ بنگلہ دیش; بنگلہ دیش};{人民共和国;}};[·24;·90];false;[ MMR; IND];·147570;🇩;{{ Bangladeshi; Bangladeshi};{ Bangladaise; Bangladais}}↵
{ Bulgaria; Republic of Bulgaria;{ bul:{ official: Република България; common: България}}};[ .bg]; BG;·100; BGR; BUL;true; officially-assigned;true; Eastern European Group;{ BGN:{ name: Bulgarian lev; symbol: лв}};{ +3;[·59]};[ Sofia];[ BG; Republic of Bulgaria; Република България]; Europe; Southeast Europe;{ bul: Bulgarian};{{ جمهورية بلغاريا; بلغاريا};{ Republik Bulgaria; Bulgaria};{ Bulharská republika; Bulharsko};{ Republik Bulgarien; Bulgarien};{ Bulgaaria Vabariik; Bulgaaria};{ Bulgarian tasavalta; Bulgaria};{publique de Bulgarie; Bulgarie};{ Republika Bugarska; Bugarska};{ Bolgárztársaság; Bulgária};{ Repubblica di Bulgaria; Bulgaria};{リア共和国;リア};{;};{ Republiek Bulgarije; Bulgarije};{ جمهوری بلغارستان; بلغارستان};{ Republika Bułgarii; Bułgaria};{ República da Bulgária; Bulgária};{ Республика Болгария; Болгария};{ Bulharská republika; Bulharsko};{ República de Bulgaria; Bulgaria};{ Republika Bugarska; Bugarska};{ Republiken Bulgarien; Bulgarien};{ Bulgaristan Cumhuriyeti; Bulgaristan};{ جمہوریہ بلغاریہ; بلغاریہ};{·利亚共和国;·利亚}};[·43;·25];false;[ GRC; MKD; ROU; SRB; TUR];·110879;🇬;{{ Bulgarian; Bulgarian};{ Bulgare; Bulgare}}↵
{ Bahrain; Kingdom of Bahrain;{ ara:{ official: مملكة البحرين; common: البحرين}}};[ .bh]; BH;·048; BHR; BRN;true; officially-assigned;true; Asia and the Pacific Group;{ BHD:{ name: Bahraini dinar; symbol: .د.ب}};{ +9;[·73]};[ Manama];[ BH; Kingdom of Bahrain; Mamlakat al-Barayn]; Asia; Western Asia;{ ara: Arabic};{{ مملكة البحرين; البحرين};{ Rouantelezh Bahrein; Bahrein};{ Královst Bahrajn; Bahrajn};{ Königreich Bahrain; Bahrain};{ Bahreini Kuningriik; Bahrein};{ Bahrainin kuningaskunta; Bahrain};{ Royaume de Bahreïn; Bahreïn};{ Kraljevina Bahrein; Bahrein};{ Bahreini Királyság; Bahrein};{ Regno del Bahrain; Bahrein};{ー�ーン王国;ー�ーン};{;};{ Koninkrijk Bahrein; Bahrein};{ پادشاهی بحرین; بحرین};{ Królestwo Bahrajnu; Bahrajn};{ Reino do Bahrein; Bahrein};{ Королевство Бахрейн; Бахрейн};{ Bahrajnské kráľovstvo; Bahrajn};{ Reino de Bahrein; Bahrein};{ Kraljevina Bahrein; Bahrein};{ Konungariket Bahrain; Bahrain};{ Bahreyn Krallığı; Bahreyn};{ مملکتِ بحرین; بحرین};{王国;}};[·26;·50.55];false;[];·765;🇭;{{ Bahraini; Bahraini};{ Bahreïnienne; Bahreïnien}}
... (truncated)
minemizer (compact)
chars: 299,485 tokens: 133,597 chars_og/tok: 8.5 enc_chars/tok: 2.2
name{common;official;native{...}};tld[];cca2;ccn3;cca3;cioc;independent;status;unMember;unRegionalGroup;currencies{...};idd{root;suffixes[]};capital[];altSpellings[];region;subregion;languages{...};translations{ara{official;common};bre{official;common};ces{official;common};deu{official;common};est{official;common};fin{official;common};fra{official;common};hrv{official;common};hun{official;common};ita{official;common};jpn{official;common};kor{official;common};nld{official;common};per{official;common};pol{official;common};por{official;common};rus{official;common};slk{official;common};spa{official;common};srp{official;common};swe{official;common};tur{official;common};urd{official;common};zho{official;common}};latlng[];landlocked;borders[];area;flag;demonyms{eng{f;m};fra{f;m}}↵
{Aruba;Aruba;{nld:{official:Aruba;common:Aruba};pap:{official:Aruba;common:Aruba}}};[.aw];AW;533;ABW;ARU;false;officially-assigned;false;;{AWG:{name:Aruban florin;symbol:ƒ}};{+2;[97]};[Oranjestad];[AW];Americas;Caribbean;{nld:Dutch;pap:Papiamento};{{أروبا;أروبا};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{アルバ;アルバ};{;};{Aruba;Aruba};{آروبا;آروبا};{Aruba;Aruba};{Aruba;Aruba};{Аруба;Аруба};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{اروبا;اروبا};{;}};[12.5;-69.96666666];false;[];180;🇦🇼;{{Aruban;Aruban};{Arubaise;Arubais}}↵
{Afghanistan;Islamic Republic of Afghanistan;{prs:{official:جمهوری اسلامی افغانستان;common:افغانستان};pus:{official:د افغانستان اسلامي جمهوریت;common:افغانستان};tuk:{official:Owganystan Yslam Respublikasy;common:Owganystan}}};[.af];AF;004;AFG;AFG;true;officially-assigned;true;Asia and the Pacific Group;{AFN:{name:Afghan afghani;symbol:}};{+9;[3]};[Kabul];[AF;Afġānistān];Asia;Southern Asia;{prs:Dari;pus:Pashto;tuk:Turkmen};{{جمهورية أففانستان الإسلامية;أفغانستان};{Republik Islamek Afghanistan;Afghanistan};{Afghánská islámská republika;Afghánistán};{Islamische Republik Afghanistan;Afghanistan};{Afganistani Islamivabariik;Afganistan};{Afganistanin islamilainen tasavalta;Afganistan};{publique islamique d'Afghanistan;Afghanistan};{Islamska Republika Afganistan;Afganistan};{Afganisztáni Iszlámztársaság;Afganisztán};{Repubblica islamica dell'Afghanistan;Afghanistan};{フ�スタンイス共和国;フ�スタン};{;};{Islamitische Republiek Afghanistan;Afghanistan};{جمهوری اسلامی افغانستان;افغانستان};{Islamska Republika Afganistanu;Afganistan};{República Islâmica do Afeganistão;Afeganistão};{Исламская Республика Афганистан;Афганистан};{Afgánsky islamský štát;Afganistan};{República Islámica de Afganistán;Afganistán};{Islamska Republika Avganistan;Avganistan};{Islamiska republiken Afghanistan;Afghanistan};{Afganistan İslam Cumhuriyeti;Afganistan};{اسلامی جمہوریہ افغانستان;افغانستان};{阿富汗伊斯兰共和国;阿富汗}};[33;65];true;[IRN;PAK;TKM;UZB;TJK;CHN];652230;🇦🇫;{{Afghan;Afghan};{Afghane;Afghan}}↵
{Angola;Republic of Angola;{por:{official:República de Angola;common:Angola}}};[.ao];AO;024;AGO;ANG;true;officially-assigned;true;African Group;{AOA:{name:Angolan kwanza;symbol:Kz}};{+2;[44]};[Luanda];[AO;República de Angola;ʁɛpublika de an'ɡɔla];Africa;Middle Africa;{por:Portuguese};{{أنغولا;جمهورية أنغولا};{Republik Angola;Angola};{Angolská republika;Angola};{Republik Angola;Angola};{Angola Vabariik;Angola};{Angolan tasavalta;Angola};{publique d'Angola;Angola};{Republika Angola;Angola};{Angola;Angola};{Repubblica dell'Angola;Angola};{アン共和国;アン};{;};{Republiek Angola;Angola};{جمهوری آنگولا;آنگولا};{Republika Angoli;Angola};{República de Angola;Angola};{Республика Ангола;Ангола};{Angolská republika;Angola};{República de Angola;Angola};{Republika Angola;Angola};{Republiken Angola;Angola};{Angola Cumhuriyeti;Angola};{جمہوریہ انگولہ;انگولہ};{共和国;}};[-12.5;18.5];false;[COG;COD;ZMB;NAM];1246700;🇦🇴;{{Angolan;Angolan};{Angolaise;Angolais}}↵
{Anguilla;Anguilla;{eng:{official:Anguilla;common:Anguilla}}};[.ai];AI;660;AIA;;false;officially-assigned;false;;{XCD:{name:Eastern Caribbean dollar;symbol:$}};{+1;[264]};[The Valley];[AI];Americas;Caribbean;{eng:English};{{أنغويلا;أنغويلا};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{アン;アン};{;};{Anguilla;Anguilla};{آنگویلا;آنگویلا};{Anguilla;Anguilla};{Anguilla;Anguilla};{Ангилья;Ангилья};{Anguilla;Anguilla};{Anguila;Anguilla};{Angvila;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{اینگویلا;اینگویلا};{;}};[18.25;-63.16666666];false;[];91;🇦🇮;{{Anguillian;Anguillian};{Anguillane;Anguillan}}↵
{Åland Islands;Åland Islands;{swe:{official:Landskapet Åland;common:Åland}}};[.ax];AX;248;ALA;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+3;[5818]};[Mariehamn];[AX;Aaland;Aland;Ahvenanmaa];Europe;Northern Europe;{swe:Swedish};{{جزر أولاند;جزر أولاند};{Inizi Åland;Åland};{Ålandské ostrovy;Ålandy};{Åland-Inseln;Åland};{Ahvenamaa maakond;Ahvenamaa};{Ahvenanmaan maakunta;Ahvenanmaa};{Ahvenanmaa;Ahvenanmaa};{Aland Islands;Ålandski otoci};{Åland-szigetek;Åland-szigetek};{Isole Åland;Isole Aland};{ー�ンド;ー�ンド};{;};{Åland eilanden;Ålandeilanden};{جزایر الند;جزایر الند};{Wyspy Alandzkie;Wyspy Alandzkie};{Ilhas Åland;Alândia};{Аландские острова;Аландские острова};{Alandské ostrovy;Alandy};{Islas Åland;Alandia};{Olandska Ostrva;Olandska Ostrva};{Åland;Åland};{Åland Adaları;Åland};{جزائر اولند;جزائر اولند};{群岛;群岛}};[60.116667;19.9];false;[];1580;🇦🇽;{{Ålandish;Ålandish};{Ålandaise;Ålandais}}↵
{Albania;Republic of Albania;{sqi:{official:Republika e Shqipërisë;common:Shqipëria}}};[.al];AL;008;ALB;ALB;true;officially-assigned;true;Eastern European Group;{ALL:{name:Albanian lek;symbol:L}};{+3;[55]};[Tirana];[AL;Shqipëri;Shqipëria;Shqipnia];Europe;Southeast Europe;{sqi:Albanian};{{جمهورية ألبانيا;ألبانيا};{Republik Albania;Albania};{Albánská republika;Albánie};{Republik Albanien;Albanien};{Albaania Vabariik;Albaania};{Albanian tasavalta;Albania};{publique d'Albanie;Albanie};{Republika Albanija;Albanija};{Albánztársaság;Albánia};{Repubblica d'Albania;Albania};{アルバニア共和国;アルバニア};{;};{Republiek Albanië;Albanië};{جمهوری آلبانی;آلبانی};{Republika Albanii;Albania};{República da Albânia;Albânia};{Республика Албания;Албания};{Albánska republika;Albánsko};{República de Albania;Albania};{Republika Albanija;Albanija};{Republiken Albanien;Albanien};{Arnavutluk Cumhuriyeti;Arnavutluk};{جمہوریہ البانیا;البانیا};{阿尔尼亚共和国;阿尔尼亚}};[41;20];false;[MNE;GRC;MKD;UNK];28748;🇦🇱;{{Albanian;Albanian};{Albanaise;Albanais}}↵
{Andorra;Principality of Andorra;{cat:{official:Principat d'Andorra;common:Andorra}}};[.ad];AD;020;AND;AND;true;officially-assigned;true;Western European and Others Group;{EUR:{name:Euro;symbol:}};{+3;[76]};[Andorra la Vella];[AD;Principality of Andorra;Principat d'Andorra];Europe;Southern Europe;{cat:Catalan};{{إمارة أندورا;أندورا};{Priñselezh Andorra;Andorra};{Andorrské knížect;Andorra};{Fürstentum Andorra;Andorra};{Andorra Vürstiriik;Andorra};{Andorran ruhtinaskunta;Andorra};{Principauté d'Andorre;Andorre};{Kneževina Andora;Andora};{Andorra;Andorra};{Principato di Andorra;Andorra};{ンド;ンド};{;};{Prinsdom Andorra;Andorra};{شاهزادهنشین آندورا;آندورا};{Księstwo Andory;Andora};{Principado de Andorra;Andorra};{Княжество Андорра;Андорра};{Andorrské kniežatstvo;Andorra};{Principado de Andorra;Andorra};{Kneževina Andora;Andora};{Furstendömet Andorra;Andorra};{Andorra Prensliği;Andorra};{اماراتِ انڈورا;انڈورا};{;}};[42.5;1.5];true;[FRA;ESP];468;🇦🇩;{{Andorran;Andorran};{Andorrane;Andorran}}↵
{United Arab Emirates;United Arab Emirates;{ara:{official:الإمارات العربية المتحدة;common:الإمارات}}};[.ae;امارات.];AE;784;ARE;UAE;true;officially-assigned;true;Asia and the Pacific Group;{AED:{name:United Arab Emirates dirham;symbol:د.إ}};{+9;[71]};[Abu Dhabi];[AE;UAE;Emirates];Asia;Western Asia;{ara:Arabic};{{الإمارات العربية المتحدة;الإمارات};{Emirelezhioù Arab Unanet;Emirelezhioù Arab Unanet};{Spojené arabské emiráty;Spojené arabské emiráty};{Vereinigte Arabische Emirate;Vereinigte Arabische Emirate};{Araabia Ühendemiraadid;Araabia Ühendemiraadid};{Yhdistyneet arabiemiirikunnat;Arabiemiraatit};{Émirats arabes unis;Émirats arabes unis};{Ujedinjeni Arapski Emirati;Ujedinjeni Arapski Emirati};{Egyesült Arab Emírségek;Egyesült Arab Emírségek};{Emirati Arabi Uniti;Emirati Arabi Uniti};{;UAE};{����;};{Verenigde Arabische Emiraten;Verenigde Arabische Emiraten};{امارات متحده عربی;امارات};{Zjednoczone Emiraty Arabskie;Zjednoczone Emiraty Arabskie};{Emirados Árabes Unidos;Emirados Árabes Unidos};{Объединенные Арабские Эмираты;Объединённые Арабские Эмираты};{Spojené arabské emiráty;Spojené arabské emiráty};{Emiratos Árabes Unidos;Emiratos Árabes Unidos};{Ujedinjeni Arapski Emirati;Ujedinjeni Arapski Emirati};{Förenade Arabemiraten;Förenade Arabemiraten};{Birleşik Arap Emirlikleri;Birleşik Arap Emirlikleri};{متحدہ عرب امارات;متحدہ عرب امارات};{阿拉伯联合;阿拉伯联合}};[24;54];false;[OMN;SAU];83600;🇦🇪;{{Emirati;Emirati};{Emirienne;Emirien}}↵
{Argentina;Argentine Republic;{grn:{official:Argentine Republic;common:Argentina};spa:{official:República Argentina;common:Argentina}}};[.ar];AR;032;ARG;ARG;true;officially-assigned;true;Latin American and Caribbean Group;{ARS:{name:Argentine peso;symbol:$}};{+5;[4]};[Buenos Aires];[AR;Argentine Republic;República Argentina];Americas;South America;{grn:Guaraní;spa:Spanish};{{جمهورية الأرجنتين;الأرجنتين};{Republik Arc'hantina;Arc'hantina};{Argentinská republika;Argentina};{Argentinische Republik;Argentinien};{Argentina Vabariik;Argentina};{Argentiinan tasavalta;Argentiina};{publique argentine;Argentine};{Argentinski Republika;Argentina};{Argentinztársaság;Argentína};{Repubblica Argentina;Argentina};{アルチン共和国;アルチン};{;};{Argentijnse Republiek;Argentinië};{جمهوری آرژانتین;آرژانتین};{Republika Argentyńska;Argentyna};{República Argentina;Argentina};{Аргентинская Республика;Аргентина};{Argentínska republika;Argentína};{República Argentina;Argentina};{Republika Argentina;Argentina};{Republiken Argentina;Argentina};{Arjantin Cumhuriyeti;Arjantin};{جمہوریہ ارجنٹائن;ارجنٹائن};{阿根廷共和国;阿根廷}};[-34;-64];false;[BOL;BRA;CHL;PRY;URY];2780400;🇦🇷;{{Argentine;Argentine};{Argentine;Argentin}}↵
{Armenia;Republic of Armenia;{hye:{official:Հայաստանի·Հանրապետություն;common:Հայաստան}}};[.am];AM;051;ARM;ARM;true;officially-assigned;true;Eastern European Group;{AMD:{name:Armenian dram;symbol:}};{+3;[74]};[Yerevan];[AM;Hayastan;Republic of Armenia;Հայաստանի·Հանրապետություն];Asia;Western Asia;{hye:Armenian};{{جمهورية أرمينيا;أرمينيا};{Republik Armenia;Armenia};{Arménská republika;Arménie};{Republik Armenien;Armenien};{Armeenia Vabariik;Armeenia};{Armenian tasavalta;Armenia};{publique d'Arménie;Arménie};{Republika Armenija;Armenija};{Örményország;Örményország};{Repubblica di Armenia;Armenia};{アルニア共和国;アルニア};{;};{Republiek Armen;Armen};{جمهوری ارمنستان;ارمنستان};{Republika Armenii;Armenia};{República da Arménia;Arménia};{Республика Армения;Армения};{Arménska republika;Arménsko};{República de Armenia;Armenia};{Republika Jermenija;Jermenija};{Republiken Armenien;Armenien};{Ermenistan Cumhuriyeti;Ermenistan};{جمہوریہ آرمینیا;آرمینیا};{尼亚共和国;尼亚}};[40;45];true;[AZE;GEO;IRN;TUR];29743;🇦🇲;{{Armenian;Armenian};{Arménienne;Arménien}}↵
{American Samoa;American Samoa;{eng:{official:American Samoa;common:American Samoa};smo:{official:Sāmoa Amelika;common:Sāmoa Amelika}}};[.as];AS;016;ASM;ASA;false;officially-assigned;false;;{USD:{name:United States dollar;symbol:$}};{+1;[684]};[Pago Pago];[AS;Amerika Sāmoa;Amelika Sāmoa;Sāmoa Amelika];Oceania;Polynesia;{eng:English;smo:Samoan};{{ساموا الأمريكية;ساموا الأمريكية};{Samoa Amerikan;Samoa Amerikan};{Americká Samoa;Americká Samoa};{Amerikanisch-Samoa;Amerikanisch-Samoa};{Ameerika Samoa;Ameerika Samoa};{Amerikan Samoa;Amerikan Samoa};{Samoa américaines;Samoa américaines};{amerka Samoa;Amerka Samoa};{Szamoa;Szamoa};{Samoa americane;Samoa Americane};{;アメリカ};{;};{Amerikaans Samoa;Amerikaans Samoa};{ساموآی آمریکا;ساموآی آمریکا};{Samoa Amerykańskie;Samoa Amerykańskie};{Samoa americana;Samoa Americana};{американское Самоа;Американское Самоа};{Americká Samoa;Americká Samoa};{Samoa Americana;Samoa Americana};{Amerka Samoa;Amerka Samoa};{Amerikanska Samoa;Amerikanska Samoa};{Amerikan Samoası;Amerikan Samoası};{امریکی سمووا;امریکی سمووا};{;}};[-14.33333333;-170];false;[];199;🇦🇸;{{American Samoan;American Samoan};{Samoane;Samoan}}↵
{Antarctica;Antarctica;{}};[.aq];AQ;010;ATA;;false;officially-assigned;false;;{};{;[]};[];[AQ];Antarctic;;{};{{أنتارتيكا;أنتارتيكا};{Antarktika;Antarktika};{Antarktida;Antarktida};{Antarktika;Antarktis};{Antarktika;Antarktika};{Etelämanner;Etelämanner};{Antarctique;Antarctique};{Antarktika;Antarktika};{Antarktisz;Antarktisz};{Antartide;Antartide};{;大陸};{;};{Antarctica;Antarctica};{جنوبگان;جنوبگان};{Antarktyka;Antarktyka};{Antártica;Antártida};{Антарктида;Антарктида};{Antarktída;Antarktída};{Antártida;Antártida};{Antarktik;Antarktik};{Antarktis;Antarktis};{Antarktika;Antarktika};{انٹارکٹکا;انٹارکٹکا};{南极;南极}};[-90;0];false;[];14000000;🇦🇶;{{Antarctican;Antarctican};{Antarcticaine;Antarcticain}}↵
{French Southern and Antarctic Lands;Territory of the French Southern and Antarctic Lands;{fra:{official:Territoire des Terres australes et antarctiques françaises;common:Terres australes et antarctiques françaises}}};[.tf];TF;260;ATF;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+2;[62]};[Port-aux-Français];[TF;French Southern Territories];Antarctic;;{fra:French};{{مقاطعات وأقاليم ما وراء البحار الفرنسية;أراض فرنسية جنوبية وأنتارتيكية};{Tiriad Douaroù Aostral hag Antarktikel Frañs;Douaroù Aostral hag Antarktikel Frañs};{Teritorium Francouzská již a antarktická území;Francouzská již a antarktická území};{Gebiet der Französisch Süd- und Antarktisgebiete;Französische Süd- und Antarktisgebiete};{Prantsuse Lõunaalad;Prantsuse Lõunaalad};{Ranskan eteläiset ja antarktiset alueet;Ranskan eteläiset ja antarktiset alueet};{Territoire des Terres australes et antarctiques françaises;Terres australes et antarctiques françaises};{Teritoriju Francuski južni i antarktički teritoriji;Francuski južni i antarktički teritoriji};{Franciali és antarktiszi területek;Franciali és antarktiszi területek};{Territorio della australi e antartiche francesi Terre;Territori Francesi del Sud};{フランス;フランス南方地域};{ 지역; 지역};{Grondgebied van de Franse Zuidelijke en Antarctische gebieden;Franse Gebieden in de zuidelijke Indische Oceaan};{سرزمینهای جنوبی و جنوبگانی فرانسه;سرزمینهای جنوبی و جنوبگانی فرانسه};{Francuskie Terytoria Południowe i Antarktyczne;Francuskie Terytoria Południowe i Antarktyczne};{Território do Sul e Antártica Francesa;Terras Austrais e Antárticas Francesas};{Территория Французские Южные и Антарктические земли;Французские Южные и Антарктические территории};{Francúzske juž a antarktické územia;Francúzske juŽ a antarktické územia};{Territorio del Francés Tierras australes y antárticas;Tierras Australes y Antárticas Francesas};{Francuske južne i antarktičke zemlje;Francuske južne i antarktičke zemlje};{Franska syd- och Antarktisterritorierna;Franskadra 
territorierna};{Fransızney ve Antarktika Toprakları;Fransızney ve Antarktika Toprakları};{سرزمینِ جنوبی فرانسیسیہ و انٹارکٹیکہ;سرزمین جنوبی فرانسیسیہ و انٹارکٹیکا};{法国南部南极土地;法国南部南极土地}};[-49.25;69.167];false;[];7747;🇹🇫;{{French;French};{Française;Français}}↵
{Antigua and Barbuda;Antigua and Barbuda;{eng:{official:Antigua and Barbuda;common:Antigua and Barbuda}}};[.ag];AG;028;ATG;ANT;true;officially-assigned;true;Latin American and Caribbean Group;{XCD:{name:Eastern Caribbean dollar;symbol:$}};{+1;[268]};[Saint John's];[AG];Americas;Caribbean;{eng:English};{{أنتيغوا وباربودا;أنتيغوا وباربودا};{Antigua ha Barbuda;Antigua ha Barbuda};{Antigua a Barbuda;Antigua a Barbuda};{Antigua und Barbuda;Antigua und Barbuda};{Antigua ja Barbuda;Antigua ja Barbuda};{Antigua ja Barbuda;Antigua ja Barbuda};{Antigua -et-Barbuda;Antigua-et-Barbuda};{Antigva i Barbuda;Antigva i Barbuda};{Antigua és Barbuda;Antigua és Barbuda};{Antigua e Barbuda;Antigua e Barbuda};{アンティー�ー�;アンティー�ー�};{��;��};{Antigua en Barbuda;Antigua en Barbuda};{آنتیگوا و باربودا;آنتیگوا و باربودا};{Antigua i Barbuda;Antigua i Barbuda};{Antigua e Barbuda;Antígua e Barbuda};{Антигуа и Барбуда;Антигуа и Барбуда};{Antigua a Barbuda;Antigua a Barbuda};{Antigua y Barbuda;Antigua y Barbuda};{Antigva i Barbuda;Antigva i Barbuda};{Antigua och Barbuda;Antigua och Barbuda};{Antigua ve Barbuda;Antigua ve Barbuda};{اینٹیگوا و باربوڈا;اینٹیگوا و باربوڈا};{;}};[17.05;-61.8];false;[];442;🇦🇬;{{Antiguan, Barbudan;Antiguan, Barbudan};{Antiguaise et barbudienne;Antiguaise et barbudien}}↵
{Australia;Commonwealth of Australia;{eng:{official:Commonwealth of Australia;common:Australia}}};[.au];AU;036;AUS;AUS;true;officially-assigned;true;Western European and Others Group;{AUD:{name:Australian dollar;symbol:$}};{+6;[1]};[Canberra];[AU];Oceania;Australia and New Zealand;{eng:English};{{كومونولث أستراليا;أستراليا};{Kenglad Aostralia;Aostralia};{Australské společenst;Austrálie};{Commonwealth Australien;Australien};{Austraalia Ühendus;Austraalia};{Australian liittovaltio;Australia};{Australie;Australie};{Commonwealth of Australia;Australija};{Ausztrál Államszövetség;Ausztrália};{Commonwealth dell'Australia;Australia};{ーストラリア;ーストラリア};{스트;};{Gemenebest van Austral;Austral};{قلمرو همسود استرالیا;استرالیا};{Związek Australijski;Australia};{Comunidade da Austrália;Austrália};{Содружество Австралии;Австралия};{Austrálsky zz;Austrália};{Mancomunidad de Australia;Australia};{Komonvelt Australija;Australija};{Australiska statsförbundet;Australien};{Avustralya Federal Devleti;Avustralya};{دولتِ مشترکہ آسٹریلیا;آسٹریلیا};{澳大利亚联邦;澳大利亚}};[-27;133];false;[];7692024;🇦🇺;{{Australian;Australian};{Australienne;Australien}}↵
{Austria;Republic of Austria;{bar:{official:Republik Österreich;common:Österreich}}};[.at];AT;040;AUT;AUT;true;officially-assigned;true;Western European and Others Group;{EUR:{name:Euro;symbol:}};{+4;[3]};[Vienna];[AT;Osterreich;Oesterreich];Europe;Central Europe;{bar:Austro-Bavarian German};{{جمهورية النمسا;النمسا};{Republik Aostria;Aostria};{Rakouská republika;Rakousko};{Republik Österreich;Österreich};{Austria Vabariik;Austria};{Itävallan tasavalta;Itävalta};{publique d'Autriche;Autriche};{Republika Austrija;Austrija};{Ausztria;Ausztria};{Repubblica d'Austria;Austria};{ースリア共和国;ースリア};{스트;스트};{Republiek Oostenrijk;Oostenrijk};{جمهوری اتریش;اتریش};{Republika Austrii;Austria};{República da Áustria;Áustria};{Австрийская Республика;Австрия};{Rakúska republika;Rakúsko};{República de Austria;Austria};{Republika Austrija;Austrija};{Republiken Österrike;Österrike};{Avusturya Cumhuriyeti;Avusturya};{جمہوریہ آسٹریا;آسٹریا};{奥地利共和国;奥地利}};[47.33333333;13.33333333];true;[CZE;DEU;HUN;ITA;LIE;SVK;SVN;CHE];83871;🇦🇹;{{Austrian;Austrian};{Autrichienne;Autrichien}}↵
{Azerbaijan;Republic of Azerbaijan;{aze:{official:Azərbaycan Respublikası;common:Azərbaycan};rus:{official:Азербайджанская Республика;common:Азербайджан}}};[.az];AZ;031;AZE;AZE;true;officially-assigned;true;Eastern European Group;{AZN:{name:Azerbaijani manat;symbol:}};{+9;[94]};[Baku];[AZ;Republic of Azerbaijan;Azərbaycan Respublikası];Asia;Western Asia;{aze:Azerbaijani;rus:Russian};{{جمهورية أذربيجان;أذربيجان};{Republik Azerbaidjan;Azerbaidjan};{Ázerbájdžánská republika;Ázerbájdžán};{Republik Aserbaidschan;Aserbaidschan};{Aserbaidžaani Vabariik;Aserbaidžaan};{Azerbaidzanin tasavalta;Azerbaidzan};{publique d'Azerbaïdjan;Azerbaïdjan};{Republika Azerbajdžan;Azerbajdžan};{Azerbajdzsán;Azerbajdzsán};{Repubblica dell'Azerbaigian;Azerbaijan};{バイジャン共和国;バイジャン};{;};{Republiek Azerbeidzjan;Azerbeidzjan};{جمهوری آذربایجان;جمهوری آذربایجان};{Republika Azerbejdżanu;Azerbejdżan};{República do Azerbaijão;Azerbeijão};{Азербайджанская Республика;Азербайджан};{Azerbajanská republika;Azerbajan};{República de Azerbaiyán;Azerbaiyán};{Republika Azerbejdžan;Azerbejdžan};{Republiken Azerbajdzjan;Azerbajdzjan};{Azerbaycan Cumhuriyeti;Azerbaycan};{جمہوریہ آذربائیجان;آذربائیجان};{共和国;}};[40.5;47.5];true;[ARM;GEO;IRN;RUS;TUR];86600;🇦🇿;{{Azerbaijani;Azerbaijani};{Azerbaïdjanaise;Azerbaïdjanais}}↵
{Burundi;Republic of Burundi;{fra:{official:publique du Burundi;common:Burundi};run:{official:Republika y'Uburundi ;common:Uburundi}}};[.bi];BI;108;BDI;BDI;true;officially-assigned;true;African Group;{BIF:{name:Burundian franc;symbol:Fr}};{+2;[57]};[Gitega];[BI;Republic of Burundi;Republika y'Uburundi;publique du Burundi];Africa;Eastern Africa;{fra:French;run:Kirundi};{{جمهورية بوروندي;بوروندي};{Republik Burundi;Burundi};{Burundská republika;Burundi};{Republik Burundi;Burundi};{Burundi Vabariik;Burundi};{Burundin tasavalta;Burundi};{publique du Burundi;Burundi};{Burundi;Burundi};{Burundi;Burundi};{Repubblica del Burundi;Burundi};{ブル共和国;ブル};{;};{Republiek Burundi;Burundi};{جمهوری بوروندی;بوروندی};{Republika Burundi;Burundi};{República do Burundi;Burundi};{Республика Бурунди;Бурунди};{Burundská republika;Burundi};{República de Burundi;Burundi};{Republika Burundi;Burundi};{Republiken Burundi;Burundi};{Burundi Cumhuriyeti;Burundi};{جمہوریہ برونڈی;برونڈی};{共和国;}};[-3.5;30];true;[COD;RWA;TZA];27834;🇧🇮;{{Burundian;Burundian};{Burundaise;Burundais}}↵
{Belgium;Kingdom of Belgium;{deu:{official:Königreich Belgien;common:Belgien};fra:{official:Royaume de Belgique;common:Belgique};nld:{official:Koninkrijk België;common:België}}};[.be];BE;056;BEL;BEL;true;officially-assigned;true;Western European and Others Group;{EUR:{name:Euro;symbol:}};{+3;[2]};[Brussels];[BE;België;Belgie;Belgien;Belgique;Kingdom of Belgium;Koninkrijk België;Royaume de Belgique;Königreich Belgien];Europe;Western Europe;{deu:German;fra:French;nld:Dutch};{{مملكة بلجيكا;بلجيكا};{Rouantelezh Belgia;Belgia};{Belgické královst;Belgie};{Königreich Belgien;Belgien};{Belgia Kuningriik;Belgia};{Belgian kuningaskunta;Belgia};{Royaume de Belgique;Belgique};{Kraljevina Belgija;Belgija};{Belga Királyság;Belgium};{Regno del Belgio;Belgio};{ベル王国;ベル};{기에;기에};{Koninkrijk België;België};{پادشاهی بلژیک;بلژیک};{Królestwo Belgii;Belgia};{Reino da Bélgica;Bélgica};{Королевство Бельгия;Бельгия};{Belgické kráľovstvo;Belgicko};{Reino de Bélgica;Bélgica};{Kraljevina Belgija;Belgija};{Konungariket Belgien;Belgien};{Belçika Krallığı;Belçika};{مملکتِ بلجئیم;بلجئیم};{比利时王国;比利时}};[50.83333333;4];false;[FRA;DEU;LUX;NLD];30528;🇧🇪;{{Belgian;Belgian};{Belge;Belge}}↵
{Benin;Republic of Benin;{fra:{official:publique du Bénin;common:Bénin}}};[.bj];BJ;204;BEN;BEN;true;officially-assigned;true;African Group;{XOF:{name:West African CFA franc;symbol:Fr}};{+2;[29]};[Porto-Novo];[BJ;Republic of Benin;publique du Bénin];Africa;Western Africa;{fra:French};{{جمهورية بنين;بنين};{Republik Benin;Benin};{Beninská republika;Benin};{Republik Benin;Benin};{Benini Vabariik;Benin};{Beninin tasavalta;Benin};{publique du Bénin;Bénin};{Republika Benin;Benin};{Beniniztársaság;Benin};{Repubblica del Benin;Benin};{ナン共和国;ナン};{;};{Republiek Benin;Benin};{جمهوری بنین;بنین};{Benin;Benin};{República do Benin;Benin};{Республика Бенин;Бенин};{Beninská republika;Benin};{República de Benin;Benín};{Republika Benin;Benin};{Republiken Benin;Benin};{Benin Cumhuriyeti;Benin};{جمہوریہ بینن;بینن};{共和国;}};[9.5;2.25];false;[BFA;NER;NGA;TGO];112622;🇧🇯;{{Beninese;Beninese};{Béninoise;Béninois}}↵
{Burkina Faso;Burkina Faso;{fra:{official:publique du Burkina;common:Burkina Faso}}};[.bf];BF;854;BFA;BUR;true;officially-assigned;true;African Group;{XOF:{name:West African CFA franc;symbol:Fr}};{+2;[26]};[Ouagadougou];[BF];Africa;Western Africa;{fra:French};{{بوركينا فاسو;بوركينا فاسو};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{publique du Burkina;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina};{Burkina Faso;Burkina Faso};{ブルファ;ブルファ};{;};{Burkina Faso;Burkina Faso};{بورکینافاسو;بورکینافاسو};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Буркина -Фасо;Буркина-Фасо};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{برکینا فاسو;برکینا فاسو};{;}};[13;-2];true;[BEN;CIV;GHA;MLI;NER;TGO];272967;🇧🇫;{{Burkinabe;Burkinabe};{Burkinabée;Burkinabé}}↵
{Bangladesh;People's Republic of Bangladesh;{ben:{official:া�া�্�া�্�্�;common:া�া�}}};[.bd];BD;050;BGD;BAN;true;officially-assigned;true;Asia and the Pacific Group;{BDT:{name:Bangladeshi taka;symbol:}};{+8;[80]};[Dhaka];[BD;People's Republic of Bangladesh;Gônôprôjatôntri Bangladesh];Asia;Southern Asia;{ben:Bengali};{{جمهورية بنغلاديش الشعبية;بنغلاديش};{Republik pobl Bangladesh;Bangladesh};{Bangladéšská lidová republika;Bangladéš};{Volksrepublik Bangladesch;Bangladesch};{Bangladeshi Rahvavabariik;Bangladesh};{Bangladeshin kansantasavalta;Bangladesh};{Lapublique populaire du Bangladesh;Bangladesh};{Narodna Republika Bangladeš;Bangladeš};{Banglades;Banglades};{Repubblica popolare del Bangladesh;Bangladesh};{ングシュ人民共和国;ングシュ};{;};{Volksrepubliek Bangladesh;Bangladesh};{جمهوری خلق بنگلادش;بنگلادش};{Ludowa Republika Bangladeszu;Bangladesz};{República Popular do Bangladesh;Bangladesh};{Народная Республика Бангладеш;Бангладеш};{Bangladéšskaudová republika;Bangladéš};{República Popular de Bangladesh;Bangladesh};{Narodna Republika Bangladeš;Bangladeš};{Folkrepubliken Bangladesh;Bangladesh};{Bangladeş Halk Cumhuriyeti;Bangladeş};{عوامی جمہوریہ بنگلہ دیش;بنگلہ دیش};{人民共和国;}};[24;90];false;[MMR;IND];147570;🇧🇩;{{Bangladeshi;Bangladeshi};{Bangladaise;Bangladais}}↵
{Bulgaria;Republic of Bulgaria;{bul:{official:Република България;common:България}}};[.bg];BG;100;BGR;BUL;true;officially-assigned;true;Eastern European Group;{BGN:{name:Bulgarian lev;symbol:лв}};{+3;[59]};[Sofia];[BG;Republic of Bulgaria;Република България];Europe;Southeast Europe;{bul:Bulgarian};{{جمهورية بلغاريا;بلغاريا};{Republik Bulgaria;Bulgaria};{Bulharská republika;Bulharsko};{Republik Bulgarien;Bulgarien};{Bulgaaria Vabariik;Bulgaaria};{Bulgarian tasavalta;Bulgaria};{publique de Bulgarie;Bulgarie};{Republika Bugarska;Bugarska};{Bolgárztársaság;Bulgária};{Repubblica di Bulgaria;Bulgaria};{ブルリア共和国;ブルリア};{;};{Republiek Bulgarije;Bulgarije};{جمهوری بلغارستان;بلغارستان};{Republika Bułgarii;Bułgaria};{República da Bulgária;Bulgária};{Республика Болгария;Болгария};{Bulharská republika;Bulharsko};{República de Bulgaria;Bulgaria};{Republika Bugarska;Bugarska};{Republiken Bulgarien;Bulgarien};{Bulgaristan Cumhuriyeti;Bulgaristan};{جمہوریہ بلغاریہ;بلغاریہ};{利亚共和国;利亚}};[43;25];false;[GRC;MKD;ROU;SRB;TUR];110879;🇧🇬;{{Bulgarian;Bulgarian};{Bulgare;Bulgare}}↵
{Bahrain;Kingdom of Bahrain;{ara:{official:مملكة البحرين;common:البحرين}}};[.bh];BH;048;BHR;BRN;true;officially-assigned;true;Asia and the Pacific Group;{BHD:{name:Bahraini dinar;symbol:.د.ب}};{+9;[73]};[Manama];[BH;Kingdom of Bahrain;Mamlakat al-Barayn];Asia;Western Asia;{ara:Arabic};{{مملكة البحرين;البحرين};{Rouantelezh Bahrein;Bahrein};{Klovst Bahrajn;Bahrajn};{Königreich Bahrain;Bahrain};{Bahreini Kuningriik;Bahrein};{Bahrainin kuningaskunta;Bahrain};{Royaume de Bahreïn;Bahreïn};{Kraljevina Bahrein;Bahrein};{Bahreini Királyság;Bahrein};{Regno del Bahrain;Bahrein};{ー�ーン王国;ー�ーン};{;};{Koninkrijk Bahrein;Bahrein};{پادشاهی بحرین;بحرین};{Królestwo Bahrajnu;Bahrajn};{Reino do Bahrein;Bahrein};{Королевство Бахрейн;Бахрейн};{Bahrajnské kráľovstvo;Bahrajn};{Reino de Bahrein;Bahrein};{Kraljevina Bahrein;Bahrein};{Konungariket Bahrain;Bahrain};{Bahreyn Krallığı;Bahreyn};{مملکتِ بحرین;بحرین};{王国;}};[26;50.55];false;[];765;🇧🇭;{{Bahraini;Bahraini};{Bahreïnienne;Bahreïnien}}
... (truncated)
large_non_uniform_nested_mixed.json — Original: 2402 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)2,4028162.92.9
JSON (min)1,5004495.33.3
CSVN/A
TSVN/A
YAML1,5735594.32.8
TOON1,7665724.23.1
TSON1,2754625.22.8
minemizer1,2034006.03.0
minemizer (compact)1,0723826.32.8
JSON (pretty)
chars: 2,402 tokens: 816 chars_og/tok: 2.9 enc_chars/tok: 2.9
[↵
· {↵
··· "id":·1,↵
··· "name": "Alice",↵
··· "work": {↵
····· "title": "Senior Engineer",↵
····· "years":·5,↵
····· "remote": true,↵
····· "team": "Platform"↵
··· },↵
··· "contact": {↵
····· "email": "alice@co.com"↵
··· }↵
· },↵
· {↵
··· "id":·2,↵
··· "profile": {↵
····· "age":·28,↵
····· "city": "NYC",↵
····· "verified": true
··· },↵
··· "status": "active",↵
··· "permissions": {↵
····· "admin": false,↵
····· "editor": true
... (truncated)
JSON (min)
chars: 1,500 tokens: 449 chars_og/tok: 5.3 enc_chars/tok: 3.3
[{"id":1,"name":"Alice","work":{"title":"Senior Engineer","years":5,"remote":true,"team":"Platform"},"contact":{"email":"alice@co.com"}},{"id":2,"profile":{"age":28,"city":"NYC","verified":true},"status":"active","permissions":{"admin":false,"editor":true}},{"id":3,"name":"Charlie","contact":{"email":"c@example.com","preferred":"email","phone":"555-0103"},"metadata":{"created":"2019-06-10"}},{"id":4,"user":{"username":"diana","role":"admin","level":5},"metadata":{"created":"2020-09-01","updated":"2024-01-20"},"settings":{"theme":"dark"}},{"id":5,"employee":{"name":"Eve Adams","department":"Sales"},"performance":{"score":85,"reviews":3},"contact":{"email":"eve@co.com","slack":"@eve"}},{"id":6,"name":"Frank","work":{"title":"Product Manager","years":8,"remote":false,"team":"Growth"},"contact":{"email":"frank@co.com","phone":"555-0106"}},{"id":7,"profile":{"age":35,"city":"LA","verified":false},"status":"inactive","permissions":{"admin":true,"editor":false},"metadata":{"created":"2018-03-15"}},{"id":8,"name":"Grace","contact":{"email":"grace@example.org","preferred":"slack","slack":"@grace"},"settings":{"theme":"light","notifications":true}},{"id":9,"user":{"username":"henry","role":"viewer","level":2},"employee":{"name":"Henry Wilson","department":"Marketing"},"performance":{"score":72,"reviews":5}},{"id":10,"name":"Iris","work":{"title":"Designer","years":3,"remote":true,"team":"Creative"},"profile":{"age":26,"city":"Austin","verified":true},"contact":{"email":"iris@co.com"}}]
CSV: N/A
TSV: N/A
YAML
chars: 1,573 tokens: 559 chars_og/tok: 4.3 enc_chars/tok: 2.8
- contact:↵
··· email: alice@co.com
· id:·1
· name: Alice
· work:↵
··· remote: true
··· team: Platform
··· title: Senior Engineer
··· years:·5
- id:·2
· permissions:↵
··· admin: false
··· editor: true
· profile:↵
··· age:·28
··· city: NYC
··· verified: true
· status: active
- contact:↵
··· email: c@example.com
··· phone:·555-0103
··· preferred: email
· id:·3
· metadata:↵
··· created: '2019-06-10'
... (truncated)
TOON
chars: 1,766 tokens: 572 chars_og/tok: 4.2 enc_chars/tok: 3.1
[10]:↵
· - id:·1
··· name: Alice
··· work:↵
····· title: Senior Engineer
····· years:·5
····· remote: true
····· team: Platform
··· contact:↵
····· email: alice@co.com
· - id:·2
··· profile:↵
····· age:·28
····· city: NYC
····· verified: true
··· status: active
··· permissions:↵
····· admin: false
····· editor: true
· - id:·3
··· name: Charlie
··· contact:↵
····· email: c@example.com
····· preferred: email
····· phone:·555-0103
... (truncated)
TSON
chars: 1,275 tokens: 462 chars_og/tok: 5.2 enc_chars/tok: 2.8
[{@id,name,work,contact|1,Alice,{@title,years,remote,team|"Senior Engineer",5,true,Platform},{@email|"alice@co.com"}},{@id,profile,status,permissions|2,{@age,city,verified|28,NYC,true},active,{@admin,editor|false,true}},{@id,name,contact,metadata|3,Charlie,{@email,preferred,phone|"c@example.com",email,555-0103},{@created|2019-06-10}},{@id,user,metadata,settings|4,{@username,role,level|diana,admin,5},{@created,updated|2020-09-01,2024-01-20},{@theme|dark}},{@id,employee,performance,contact|5,{@name,department|"Eve Adams",Sales},{@score,reviews|85,3},{@email,slack|"eve@co.com","@eve"}},{@id,name,work,contact|6,Frank,{@title,years,remote,team|"Product Manager",8,false,Growth},{@email,phone|"frank@co.com",555-0106}},{@id,profile,status,permissions,metadata|7,{@age,city,verified|35,LA,false},inactive,{@admin,editor|true,false},{@created|2018-03-15}},{@id,name,contact,settings|8,Grace,{@email,preferred,slack|"grace@example.org",slack,"@grace"},{@theme,notifications|light,true}},{@id,user,employee,performance|9,{@username,role,level|henry,viewer,2},{@name,department|"Henry Wilson",Marketing},{@score,reviews|72,5}},{@id,name,work,profile,contact|10,Iris,{@title,years,remote,team|Designer,3,true,Creative},{@age,city,verified|26,Austin,true},{@email|"iris@co.com"}}]
minemizer
chars: 1,203 tokens: 400 chars_og/tok: 6.0 enc_chars/tok: 3.0
id; name; contact{ email; ...}↵
1; Alice;{ alice@co.com}; work{ title: Senior Engineer; years:·5; remote:true; team: Platform}↵
2;;; profile{ age:·28; city: NYC; verified:true}; status: active; permissions{ admin:false; editor:true}↵
3; Charlie;{ c@example.com; preferred: email; phone:·555-0103}; metadata{ created:·2019-06-10}↵
4;;; user{ username: diana; role: admin; level:·5}; metadata{ created:·2020-09-01; updated:·2024-01-20}; settings{ theme: dark}↵
5;;{ eve@co.com; slack: @eve}; employee{ name: Eve Adams; department: Sales}; performance{ score:·85; reviews:·3}↵
6; Frank;{ frank@co.com; phone:·555-0106}; work{ title: Product Manager; years:·8; remote:false; team: Growth}↵
7;;; profile{ age:·35; city: LA; verified:false}; status: inactive; permissions{ admin:true; editor:false}; metadata{ created:·2018-03-15}↵
8; Grace;{ grace@example.org; preferred: slack; slack: @grace}; settings{ theme: light; notifications:true}↵
9;;; user{ username: henry; role: viewer; level:·2}; employee{ name: Henry Wilson; department: Marketing}; performance{ score:·72; reviews:·5}↵
10; Iris;{ iris@co.com}; work{ title: Designer; years:·3; remote:true; team: Creative}; profile{ age:·26; city: Austin; verified:true}
minemizer (compact)
chars: 1,072 tokens: 382 chars_og/tok: 6.3 enc_chars/tok: 2.8
id;name;contact{email;...}↵
1;Alice;{alice@co.com};work{title:Senior Engineer;years:5;remote:true;team:Platform}↵
2;;;profile{age:28;city:NYC;verified:true};status:active;permissions{admin:false;editor:true}↵
3;Charlie;{c@example.com;preferred:email;phone:555-0103};metadata{created:2019-06-10}↵
4;;;user{username:diana;role:admin;level:5};metadata{created:2020-09-01;updated:2024-01-20};settings{theme:dark}↵
5;;{eve@co.com;slack:@eve};employee{name:Eve Adams;department:Sales};performance{score:85;reviews:3}↵
6;Frank;{frank@co.com;phone:555-0106};work{title:Product Manager;years:8;remote:false;team:Growth}↵
7;;;profile{age:35;city:LA;verified:false};status:inactive;permissions{admin:true;editor:false};metadata{created:2018-03-15}↵
8;Grace;{grace@example.org;preferred:slack;slack:@grace};settings{theme:light;notifications:true}↵
9;;;user{username:henry;role:viewer;level:2};employee{name:Henry Wilson;department:Marketing};performance{score:72;reviews:5}↵
10;Iris;{iris@co.com};work{title:Designer;years:3;remote:true;team:Creative};profile{age:26;city:Austin;verified:true}
large_non_uniform_nested_numerical.json — Original: 2947 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)2,9471,3322.22.2
JSON (min)1,8738843.32.1
CSVN/A
TSVN/A
YAML2,0851,0772.71.9
TOON2,3181,0902.72.1
TSON1,6429073.21.8
minemizer1,5348833.31.7
minemizer (compact)1,3618093.61.7
JSON (pretty)
chars: 2,947 tokens: 1,332 chars_og/tok: 2.2 enc_chars/tok: 2.2
[↵
· {↵
··· "id":·1,↵
··· "metrics": {↵
····· "views":·15420,↵
····· "clicks":·842,↵
····· "ctr":·0.0546,↵
····· "bounce_rate":·0.32
··· },↵
··· "revenue": {↵
····· "amount":·12499.99,↵
····· "currency_rate":·1.0
··· },↵
··· "timestamp": "2024-01-15T09:30:00Z"↵
· },↵
· {↵
··· "id":·2,↵
··· "metrics": {↵
····· "views":·8923,↵
····· "clicks":·156,↵
····· "ctr":·0.0175,↵
····· "bounce_rate":·0.67
··· },↵
··· "stats": {↵
····· "avg_time":·45.7,
... (truncated)
JSON (min)
chars: 1,873 tokens: 884 chars_og/tok: 3.3 enc_chars/tok: 2.1
[{"id":1,"metrics":{"views":15420,"clicks":842,"ctr":0.0546,"bounce_rate":0.32},"revenue":{"amount":12499.99,"currency_rate":1.0},"timestamp":"2024-01-15T09:30:00Z"},{"id":2,"metrics":{"views":8923,"clicks":156,"ctr":0.0175,"bounce_rate":0.67},"stats":{"avg_time":45.7,"pages_per_session":2.3,"return_rate":0.15},"timestamp":"2024-01-16T14:22:33Z"},{"id":3,"revenue":{"amount":8750.5,"tax":700.04,"net":8050.46,"currency_rate":0.92},"inventory":{"count":342,"reserved":28,"available":314}},{"id":4,"metrics":{"views":52100,"clicks":3891,"ctr":0.0747,"bounce_rate":0.21},"performance":{"latency_ms":127.5,"uptime":0.9987,"errors":3},"timestamp":"2024-01-17T08:00:00Z"},{"id":5,"stats":{"avg_time":128.9,"pages_per_session":5.7,"return_rate":0.42},"scores":{"quality":94,"relevance":87,"engagement":0.78},"dates":{"start":"2023-06-01","end":"2024-01-31"}},{"id":6,"inventory":{"count":1205,"reserved":89,"available":1116,"reorder_point":200},"pricing":{"cost":24.99,"markup":0.35,"price":33.74},"timestamp":"2024-01-18T11:45:12Z"},{"id":7,"metrics":{"views":3156,"clicks":98,"ctr":0.031,"bounce_rate":0.55},"revenue":{"amount":2150.0,"tax":172.0,"net":1978.0},"performance":{"latency_ms":89.2,"uptime":0.9995,"errors":0}},{"id":8,"scores":{"quality":78,"relevance":92,"engagement":0.65,"nps":45},"dates":{"start":"2022-11-15","end":"2024-02-28","renewal":"2024-03-01"},"budget":{"allocated":50000,"spent":42350.75,"remaining":7649.25}},{"id":9,"pricing":{"cost":149.99,"markup":0.28,"price":191.99,"discount":0.1},"inventory":{"count":56,"reserved":12,"available":44},"timestamp":"2024-01-19T16:30:45Z"},{"id":10,"metrics":{"views":128750,"clicks":9823,"ctr":0.0763,"bounce_rate":0.18},"stats":{"avg_time":312.4,"pages_per_session":8.2,"return_rate":0.58},"budget":{"allocated":125000,"spent":98420.33,"remaining":26579.67},"dates":{"start":"2023-01-01","end":"2024-12-31"}}]
CSV: N/A
TSV: N/A
YAML
chars: 2,085 tokens: 1,077 chars_og/tok: 2.7 enc_chars/tok: 1.9
- id:·1
· metrics:↵
··· bounce_rate:·0.32
··· clicks:·842
··· ctr:·0.0546
··· views:·15420
· revenue:↵
··· amount:·12499.99
··· currency_rate:·1.0
· timestamp: '2024-01-15T09:30:00Z'↵
- id:·2
· metrics:↵
··· bounce_rate:·0.67
··· clicks:·156
··· ctr:·0.0175
··· views:·8923
· stats:↵
··· avg_time:·45.7
··· pages_per_session:·2.3
··· return_rate:·0.15
· timestamp: '2024-01-16T14:22:33Z'↵
- id:·3
· inventory:↵
··· available:·314
··· count:·342
... (truncated)
TOON
chars: 2,318 tokens: 1,090 chars_og/tok: 2.7 enc_chars/tok: 2.1
[10]:↵
· - id:·1
··· metrics:↵
····· views:·15420
····· clicks:·842
····· ctr:·0.0546
····· bounce_rate:·0.32
··· revenue:↵
····· amount:·12499.99
····· currency_rate:·1.0
··· timestamp: "2024-01-15T09:30:00Z"↵
· - id:·2
··· metrics:↵
····· views:·8923
····· clicks:·156
····· ctr:·0.0175
····· bounce_rate:·0.67
··· stats:↵
····· avg_time:·45.7
····· pages_per_session:·2.3
····· return_rate:·0.15
··· timestamp: "2024-01-16T14:22:33Z"↵
· - id:·3
··· revenue:↵
····· amount:·8750.5
... (truncated)
TSON
chars: 1,642 tokens: 907 chars_og/tok: 3.2 enc_chars/tok: 1.8
[{@id,metrics,revenue,timestamp|1,{@views,clicks,ctr,bounce_rate|15420,842,0.0546,0.32},{@amount,currency_rate|12499.99,1.0},2024-01-15T09:30:00Z},{@id,metrics,stats,timestamp|2,{@views,clicks,ctr,bounce_rate|8923,156,0.0175,0.67},{@avg_time,pages_per_session,return_rate|45.7,2.3,0.15},2024-01-16T14:22:33Z},{@id,revenue,inventory|3,{@amount,tax,net,currency_rate|8750.5,700.04,8050.46,0.92},{@count,reserved,available|342,28,314}},{@id,metrics,performance,timestamp|4,{@views,clicks,ctr,bounce_rate|52100,3891,0.0747,0.21},{@latency_ms,uptime,errors|127.5,0.9987,3},2024-01-17T08:00:00Z},{@id,stats,scores,dates|5,{@avg_time,pages_per_session,return_rate|128.9,5.7,0.42},{@quality,relevance,engagement|94,87,0.78},{@start,end|2023-06-01,2024-01-31}},{@id,inventory,pricing,timestamp|6,{@count,reserved,available,reorder_point|1205,89,1116,200},{@cost,markup,price|24.99,0.35,33.74},2024-01-18T11:45:12Z},{@id,metrics,revenue,performance|7,{@views,clicks,ctr,bounce_rate|3156,98,0.031,0.55},{@amount,tax,net|2150.0,172.0,1978.0},{@latency_ms,uptime,errors|89.2,0.9995,0}},{@id,scores,dates,budget|8,{@quality,relevance,engagement,nps|78,92,0.65,45},{@start,end,renewal|2022-11-15,2024-02-28,2024-03-01},{@allocated,spent,remaining|50000,42350.75,7649.25}},{@id,pricing,inventory,timestamp|9,{@cost,markup,price,discount|149.99,0.28,191.99,0.1},{@count,reserved,available|56,12,44},2024-01-19T16:30:45Z},{@id,metrics,stats,budget,dates|10,{@views,clicks,ctr,bounce_rate|128750,9823,0.0763,0.18},{@avg_time,pages_per_session,return_rate|312.4,8.2,0.58},{@allocated,spent,remaining|125000,98420.33,26579.67},{@start,end|2023-01-01,2024-12-31}}]
minemizer
chars: 1,534 tokens: 883 chars_og/tok: 3.3 enc_chars/tok: 1.7
id; metrics{ views; clicks; ctr; bounce_rate}; timestamp
1;{·15420;·842;·0.0546;·0.32};·2024-01-15T09:30:00Z; revenue{ amount:·12499.99; currency_rate:·1.0}↵
2;{·8923;·156;·0.0175;·0.67};·2024-01-16T14:22:33Z; stats{ avg_time:·45.7; pages_per_session:·2.3; return_rate:·0.15}↵
3;;; revenue{ amount:·8750.5; tax:·700.04; net:·8050.46; currency_rate:·0.92}; inventory{ count:·342; reserved:·28; available:·314}↵
4;{·52100;·3891;·0.0747;·0.21};·2024-01-17T08:00:00Z; performance{ latency_ms:·127.5; uptime:·0.9987; errors:·3}↵
5;;; stats{ avg_time:·128.9; pages_per_session:·5.7; return_rate:·0.42}; scores{ quality:·94; relevance:·87; engagement:·0.78}; dates{ start:·2023-06-01; end:·2024-01-31}↵
6;;·2024-01-18T11:45:12Z; inventory{ count:·1205; reserved:·89; available:·1116; reorder_point:·200}; pricing{ cost:·24.99; markup:·0.35; price:·33.74}↵
7;{·3156;·98;·0.031;·0.55};; revenue{ amount:·2150.0; tax:·172.0; net:·1978.0}; performance{ latency_ms:·89.2; uptime:·0.9995; errors:·0}↵
8;;; scores{ quality:·78; relevance:·92; engagement:·0.65; nps:·45}; dates{ start:·2022-11-15; end:·2024-02-28; renewal:·2024-03-01}; budget{ allocated:·50000; spent:·42350.75; remaining:·7649.25}↵
9;;·2024-01-19T16:30:45Z; pricing{ cost:·149.99; markup:·0.28; price:·191.99; discount:·0.1}; inventory{ count:·56; reserved:·12; available:·44}↵
10;{·128750;·9823;·0.0763;·0.18};; stats{ avg_time:·312.4; pages_per_session:·8.2; return_rate:·0.58}; budget{ allocated:·125000; spent:·98420.33; remaining:·26579.67}; dates{ start:·2023-01-01; end:·2024-12-31}
minemizer (compact)
chars: 1,361 tokens: 809 chars_og/tok: 3.6 enc_chars/tok: 1.7
id;metrics{views;clicks;ctr;bounce_rate};timestamp
1;{15420;842;0.0546;0.32};2024-01-15T09:30:00Z;revenue{amount:12499.99;currency_rate:1.0}↵
2;{8923;156;0.0175;0.67};2024-01-16T14:22:33Z;stats{avg_time:45.7;pages_per_session:2.3;return_rate:0.15}↵
3;;;revenue{amount:8750.5;tax:700.04;net:8050.46;currency_rate:0.92};inventory{count:342;reserved:28;available:314}↵
4;{52100;3891;0.0747;0.21};2024-01-17T08:00:00Z;performance{latency_ms:127.5;uptime:0.9987;errors:3}↵
5;;;stats{avg_time:128.9;pages_per_session:5.7;return_rate:0.42};scores{quality:94;relevance:87;engagement:0.78};dates{start:2023-06-01;end:2024-01-31}↵
6;;2024-01-18T11:45:12Z;inventory{count:1205;reserved:89;available:1116;reorder_point:200};pricing{cost:24.99;markup:0.35;price:33.74}↵
7;{3156;98;0.031;0.55};;revenue{amount:2150.0;tax:172.0;net:1978.0};performance{latency_ms:89.2;uptime:0.9995;errors:0}↵
8;;;scores{quality:78;relevance:92;engagement:0.65;nps:45};dates{start:2022-11-15;end:2024-02-28;renewal:2024-03-01};budget{allocated:50000;spent:42350.75;remaining:7649.25}↵
9;;2024-01-19T16:30:45Z;pricing{cost:149.99;markup:0.28;price:191.99;discount:0.1};inventory{count:56;reserved:12;available:44}↵
10;{128750;9823;0.0763;0.18};;stats{avg_time:312.4;pages_per_session:8.2;return_rate:0.58};budget{allocated:125000;spent:98420.33;remaining:26579.67};dates{start:2023-01-01;end:2024-12-31}
large_non_uniform_nested_text.json — Original: 4214 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)4,2149974.24.2
JSON (min)3,3596346.65.3
CSVN/A
TSVN/A
YAML3,3877165.94.7
TOON3,5347185.94.9
TSON3,1736446.54.9
minemizer2,8095108.35.5
minemizer (compact)2,6945347.95.0
JSON (pretty)
chars: 4,214 tokens: 997 chars_og/tok: 4.2 enc_chars/tok: 4.2
[↵
· {↵
··· "id":·1,↵
··· "title": "Introduction to Machine Learning",↵
··· "author": {↵
····· "name": "Dr. Sarah Chen",↵
····· "affiliation": "Stanford University",↵
····· "department": "Computer Science"↵
··· },↵
··· "abstract": "A comprehensive overview of modern machine learning techniques and applications",↵
··· "tags": [↵
····· "AI",↵
····· "ML",↵
····· "deep learning"↵
··· ]↵
· },↵
· {↵
··· "id":·2,↵
··· "title": "Climate Change Impact Assessment",↵
··· "content": {↵
····· "summary": "Analysis of rising sea levels and temperature patterns",↵
····· "methodology": "longitudinal study with satellite imagery",↵
····· "conclusion": "significant acceleration observed since·2010"↵
··· },↵
··· "category": "Environmental Science"
... (truncated)
JSON (min)
chars: 3,359 tokens: 634 chars_og/tok: 6.6 enc_chars/tok: 5.3
[{"id":1,"title":"Introduction to Machine Learning","author":{"name":"Dr. Sarah Chen","affiliation":"Stanford University","department":"Computer Science"},"abstract":"A comprehensive overview of modern machine learning techniques and applications","tags":["AI","ML","deep learning"]},{"id":2,"title":"Climate Change Impact Assessment","content":{"summary":"Analysis of rising sea levels and temperature patterns","methodology":"longitudinal study with satellite imagery","conclusion":"significant acceleration observed since·2010"},"category":"Environmental Science"},{"id":3,"author":{"name":"Marcus Williams","affiliation":"MIT Media Lab","role":"Principal Researcher"},"publication":{"journal":"Nature Communications","volume":"fifteen","status":"peer-reviewed"},"keywords":"quantum computing, error correction, fault tolerance"},{"id":4,"title":"Urban Planning Strategies for Sustainable Cities","abstract":"Examining green infrastructure and mixed-use development patterns","content":{"summary":"Case studies from Copenhagen, Singapore, and Portland","methodology":"comparative analysis with community surveys","findings":"walkability correlates strongly with resident satisfaction"},"tags":["urban design","sustainability","planning"]},{"id":5,"publication":{"journal":"The Lancet","volume":"four hundred two","issue":"special edition","status":"published"},"content":{"summary":"Global health outcomes following pandemic response measures","conclusion":"early intervention strategies proved most effective"},"category":"Public Health"},{"id":6,"title":"Advances in Natural Language Processing","author":{"name":"Dr. 
James Rodriguez","affiliation":"Google Research","department":"Language Understanding"},"abstract":"Survey of transformer architectures and attention mechanisms in modern NLP systems","keywords":"transformers, attention, language models, BERT, GPT"},{"id":7,"content":{"summary":"Historical analysis of economic policy shifts in emerging markets","methodology":"archival research combined with econometric modeling","findings":"trade liberalization showed mixed results across regions","limitations":"data availability constraints for pre-1990 period"},"category":"Economics","tags":["policy","trade","development"]},{"id":8,"title":"Biodiversity Conservation in Tropical Rainforests","author":{"name":"Dr. Ana Costa","affiliation":"Brazilian Institute for Amazonian Research","role":"Lead Ecologist"},"publication":{"journal":"Conservation Biology","status":"under review"},"abstract":"Mapping species distribution patterns and identifying critical habitat corridors"},{"id":9,"title":"Behavioral Economics and Consumer Decision Making","content":{"summary":"Experimental studies on cognitive biases in purchasing behavior","methodology":"randomized controlled trials with eye-tracking technology","conclusion":"anchoring effects persist even with expert consumers"},"keywords":"behavioral economics, decision theory, consumer psychology","category":"Psychology"},{"id":10,"author":{"name":"Prof. Michael Thompson","affiliation":"Oxford University","department":"Engineering Science","role":"Department Chair"},"publication":{"journal":"Advanced Materials","volume":"thirty-six","status":"accepted"},"abstract":"Novel synthesis methods for high-performance ceramic composites","tags":["materials science","ceramics","nanotechnology"]}]
CSV: N/A
TSV: N/A
YAML
chars: 3,387 tokens: 716 chars_og/tok: 5.9 enc_chars/tok: 4.7
- abstract: A comprehensive overview of modern machine learning techniques and applications
· author:↵
··· affiliation: Stanford University
··· department: Computer Science
··· name: Dr. Sarah Chen
· id:·1
· tags:↵
· - AI
· - ML
· - deep learning
· title: Introduction to Machine Learning
- category: Environmental Science
· content:↵
··· conclusion: significant acceleration observed since·2010
··· methodology: longitudinal study with satellite imagery
··· summary: Analysis of rising sea levels and temperature patterns
· id:·2
· title: Climate Change Impact Assessment
- author:↵
··· affiliation: MIT Media Lab
··· name: Marcus Williams
··· role: Principal Researcher
· id:·3
· keywords: quantum computing, error correction, fault tolerance
· publication:
... (truncated)
TOON
chars: 3,534 tokens: 718 chars_og/tok: 5.9 enc_chars/tok: 4.9
[10]:↵
· - id:·1
··· title: Introduction to Machine Learning
··· author:↵
····· name: Dr. Sarah Chen
····· affiliation: Stanford University
····· department: Computer Science
··· abstract: A comprehensive overview of modern machine learning techniques and applications
··· tags[3]: AI,ML,deep learning
· - id:·2
··· title: Climate Change Impact Assessment
··· content:↵
····· summary: Analysis of rising sea levels and temperature patterns
····· methodology: longitudinal study with satellite imagery
····· conclusion: significant acceleration observed since·2010
··· category: Environmental Science
· - id:·3
··· author:↵
····· name: Marcus Williams
····· affiliation: MIT Media Lab
····· role: Principal Researcher
··· publication:↵
····· journal: Nature Communications
····· volume: fifteen
····· status: peer-reviewed
... (truncated)
TSON
chars: 3,173 tokens: 644 chars_og/tok: 6.5 enc_chars/tok: 4.9
[{@id,title,author,abstract,tags|1,"Introduction to Machine Learning",{@name,affiliation,department|"Dr. Sarah Chen","Stanford University","Computer Science"},"A comprehensive overview of modern machine learning techniques and applications",[AI,ML,"deep learning"]},{@id,title,content,category|2,"Climate Change Impact Assessment",{@summary,methodology,conclusion|"Analysis of rising sea levels and temperature patterns","longitudinal study with satellite imagery","significant acceleration observed since·2010"},"Environmental Science"},{@id,author,publication,keywords|3,{@name,affiliation,role|"Marcus Williams","MIT Media Lab","Principal Researcher"},{@journal,volume,status|"Nature Communications",fifteen,peer-reviewed},"quantum computing, error correction, fault tolerance"},{@id,title,abstract,content,tags|4,"Urban Planning Strategies for Sustainable Cities","Examining green infrastructure and mixed-use development patterns",{@summary,methodology,findings|"Case studies from Copenhagen, Singapore, and Portland","comparative analysis with community surveys","walkability correlates strongly with resident satisfaction"},["urban design",sustainability,planning]},{@id,publication,content,category|5,{@journal,volume,issue,status|"The Lancet","four hundred two","special edition",published},{@summary,conclusion|"Global health outcomes following pandemic response measures","early intervention strategies proved most effective"},"Public Health"},{@id,title,author,abstract,keywords|6,"Advances in Natural Language Processing",{@name,affiliation,department|"Dr. 
James Rodriguez","Google Research","Language Understanding"},"Survey of transformer architectures and attention mechanisms in modern NLP systems","transformers, attention, language models, BERT, GPT"},{@id,content,category,tags|7,{@summary,methodology,findings,limitations|"Historical analysis of economic policy shifts in emerging markets","archival research combined with econometric modeling","trade liberalization showed mixed results across regions","data availability constraints for pre-1990 period"},Economics,[policy,trade,development]},{@id,title,author,publication,abstract|8,"Biodiversity Conservation in Tropical Rainforests",{@name,affiliation,role|"Dr. Ana Costa","Brazilian Institute for Amazonian Research","Lead Ecologist"},{@journal,status|"Conservation Biology","under review"},"Mapping species distribution patterns and identifying critical habitat corridors"},{@id,title,content,keywords,category|9,"Behavioral Economics and Consumer Decision Making",{@summary,methodology,conclusion|"Experimental studies on cognitive biases in purchasing behavior","randomized controlled trials with eye-tracking technology","anchoring effects persist even with expert consumers"},"behavioral economics, decision theory, consumer psychology",Psychology},{@id,author,publication,abstract,tags|10,{@name,affiliation,department,role|"Prof. Michael Thompson","Oxford University","Engineering Science","Department Chair"},{@journal,volume,status|"Advanced Materials",thirty-six,accepted},"Novel synthesis methods for high-performance ceramic composites",["materials science",ceramics,nanotechnology]}]
minemizer
chars: 2,809 tokens: 510 chars_og/tok: 8.3 enc_chars/tok: 5.5
id; title; author{ name; affiliation; department; role}; abstract; content{ summary; methodology; conclusion; ...}↵
1; Introduction to Machine Learning;{ Dr. Sarah Chen; Stanford University; Computer Science;}; A comprehensive overview of modern machine learning techniques and applications;; tags[ AI; ML; deep learning]↵
2; Climate Change Impact Assessment;;;{ Analysis of rising sea levels and temperature patterns; longitudinal study with satellite imagery; significant acceleration observed since·2010}; category: Environmental Science
3;;{ Marcus Williams; MIT Media Lab;; Principal Researcher};;; publication{ journal: Nature Communications; volume: fifteen; status: peer-reviewed}; keywords: quantum computing, error correction, fault tolerance
4; Urban Planning Strategies for Sustainable Cities;; Examining green infrastructure and mixed-use development patterns;{ Case studies from Copenhagen, Singapore, and Portland; comparative analysis with community surveys;; findings: walkability correlates strongly with resident satisfaction}; tags[ urban design; sustainability; planning]↵
5;;;;{ Global health outcomes following pandemic response measures;; early intervention strategies proved most effective}; publication{ journal: The Lancet; volume: four hundred two; issue: special edition; status: published}; category: Public Health
6; Advances in Natural Language Processing;{ Dr. James Rodriguez; Google Research; Language Understanding;}; Survey of transformer architectures and attention mechanisms in modern NLP systems;; keywords: transformers, attention, language models, BERT, GPT
7;;;;{ Historical analysis of economic policy shifts in emerging markets; archival research combined with econometric modeling;; findings: trade liberalization showed mixed results across regions; limitations: data availability constraints for pre-1990 period}; category: Economics; tags[ policy; trade; development]↵
8; Biodiversity Conservation in Tropical Rainforests;{ Dr. Ana Costa; Brazilian Institute for Amazonian Research;; Lead Ecologist}; Mapping species distribution patterns and identifying critical habitat corridors;; publication{ journal: Conservation Biology; status: under review}↵
9; Behavioral Economics and Consumer Decision Making;;;{ Experimental studies on cognitive biases in purchasing behavior; randomized controlled trials with eye-tracking technology; anchoring effects persist even with expert consumers}; keywords: behavioral economics, decision theory, consumer psychology; category: Psychology
10;;{ Prof. Michael Thompson; Oxford University; Engineering Science; Department Chair}; Novel synthesis methods for high-performance ceramic composites;; publication{ journal: Advanced Materials; volume: thirty-six; status: accepted}; tags[ materials science; ceramics; nanotechnology]
minemizer (compact)
chars: 2,694 tokens: 534 chars_og/tok: 7.9 enc_chars/tok: 5.0
id;title;author{name;affiliation;department;role};abstract;content{summary;methodology;conclusion;...}↵
1;Introduction to Machine Learning;{Dr. Sarah Chen;Stanford University;Computer Science;};A comprehensive overview of modern machine learning techniques and applications;;tags[AI;ML;deep learning]↵
2;Climate Change Impact Assessment;;;{Analysis of rising sea levels and temperature patterns;longitudinal study with satellite imagery;significant acceleration observed since·2010};category:Environmental Science
3;;{Marcus Williams;MIT Media Lab;;Principal Researcher};;;publication{journal:Nature Communications;volume:fifteen;status:peer-reviewed};keywords:quantum computing, error correction, fault tolerance
4;Urban Planning Strategies for Sustainable Cities;;Examining green infrastructure and mixed-use development patterns;{Case studies from Copenhagen, Singapore, and Portland;comparative analysis with community surveys;;findings:walkability correlates strongly with resident satisfaction};tags[urban design;sustainability;planning]↵
5;;;;{Global health outcomes following pandemic response measures;;early intervention strategies proved most effective};publication{journal:The Lancet;volume:four hundred two;issue:special edition;status:published};category:Public Health
6;Advances in Natural Language Processing;{Dr. James Rodriguez;Google Research;Language Understanding;};Survey of transformer architectures and attention mechanisms in modern NLP systems;;keywords:transformers, attention, language models, BERT, GPT
7;;;;{Historical analysis of economic policy shifts in emerging markets;archival research combined with econometric modeling;;findings:trade liberalization showed mixed results across regions;limitations:data availability constraints for pre-1990 period};category:Economics;tags[policy;trade;development]↵
8;Biodiversity Conservation in Tropical Rainforests;{Dr. Ana Costa;Brazilian Institute for Amazonian Research;;Lead Ecologist};Mapping species distribution patterns and identifying critical habitat corridors;;publication{journal:Conservation Biology;status:under review}↵
9;Behavioral Economics and Consumer Decision Making;;;{Experimental studies on cognitive biases in purchasing behavior;randomized controlled trials with eye-tracking technology;anchoring effects persist even with expert consumers};keywords:behavioral economics, decision theory, consumer psychology;category:Psychology
10;;{Prof. Michael Thompson;Oxford University;Engineering Science;Department Chair};Novel synthesis methods for high-performance ceramic composites;;publication{journal:Advanced Materials;volume:thirty-six;status:accepted};tags[materials science;ceramics;nanotechnology]
mcp_tools_list.json — Original: 51663 chars — Tokenizer: qwen2.5 (Qwen/Qwen2.5-0.5B)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)51,66311,2104.64.6
JSON (min)30,7246,3688.14.8
CSVN/A
TSVN/A
YAML38,1397,9276.54.8
TOON38,3767,6706.75.0
TSON25,8785,8898.84.4
minemizer23,3835,3199.74.4
minemizer (compact)21,9125,11210.14.3
JSON (pretty)
chars: 51,663 tokens: 11,210 chars_og/tok: 4.6 enc_chars/tok: 4.6
[↵
· {↵
··· "inputSchema": {↵
····· "json": {↵
······· "properties": {↵
········· "body": {↵
··········· "description": "Comment content",↵
··········· "type": "string"↵
········· },↵
········· "issue_number": {↵
··········· "description": "Issue number to comment on",↵
··········· "type": "number"↵
········· },↵
········· "owner": {↵
··········· "description": "Repository owner",↵
··········· "type": "string"↵
········· },↵
········· "repo": {↵
··········· "description": "Repository name",↵
··········· "type": "string"↵
········· }↵
······· },↵
······· "required": [↵
········· "owner",↵
········· "repo",
... (truncated)
JSON (min)
chars: 30,724 tokens: 6,368 chars_og/tok: 8.1 enc_chars/tok: 4.8
[{"inputSchema":{"json":{"properties":{"body":{"description":"Comment content","type":"string"},"issue_number":{"description":"Issue number to comment on","type":"number"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","issue_number","body"],"type":"object"}},"name":"add_issue_comment","description":"Add a comment to a specific issue in a GitHub repository."},{"inputSchema":{"json":{"properties":{"body":{"description":"The text of the review comment","type":"string"},"line":{"description":"The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range","type":"number"},"owner":{"description":"Repository owner","type":"string"},"path":{"description":"The relative path to the file that necessitates a comment","type":"string"},"pullNumber":{"description":"Pull request number","type":"number"},"repo":{"description":"Repository name","type":"string"},"side":{"description":"The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state","enum":["LEFT","RIGHT"],"type":"string"},"startLine":{"description":"For multi-line comments, the first line of the range that the comment applies to","type":"number"},"startSide":{"description":"For multi-line comments, the starting side of the diff that the comment applies to. 
LEFT indicates the previous state, RIGHT indicates the new state","enum":["LEFT","RIGHT"],"type":"string"},"subjectType":{"description":"The level at which the comment is targeted","enum":["FILE","LINE"],"type":"string"}},"required":["owner","repo","pullNumber","path","body","subjectType"],"type":"object"}},"name":"add_pull_request_review_comment_to_pending_review","description":"Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure)."},{"inputSchema":{"json":{"properties":{"issueNumber":{"description":"Issue number","type":"number"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","issueNumber"],"type":"object"}},"name":"assign_copilot_to_issue","description":"Assign Copilot to a specific issue in a GitHub repository.\n\nThis tool can help with the following outcomes:\n- a Pull Request created with source code changes to resolve the issue\n\n\nMore information can be found at:\n- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot\n"},{"inputSchema":{"json":{"properties":{"body":{"description":"Review comment text","type":"string"},"commitID":{"description":"SHA of commit to review","type":"string"},"event":{"description":"Review action to perform","enum":["APPROVE","REQUEST_CHANGES","COMMENT"],"type":"string"},"owner":{"description":"Repository owner","type":"string"},"pullNumber":{"description":"Pull request number","type":"number"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","pullNumber","body","event"],"type":"object"}},"name":"create_and_submit_pull_request_review","description":"Create and submit a review for a pull request without review comments."},{"inputSchema":{"json":{"properties":{"branch":{"description":"Name for new 
branch","type":"string"},"from_branch":{"description":"Source branch (defaults to repo default)","type":"string"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","branch"],"type":"object"}},"name":"create_branch","description":"Create a new branch in a GitHub repository"},{"inputSchema":{"json":{"properties":{"assignees":{"description":"Usernames to assign to this issue","items":{"type":"string"},"type":"array"},"body":{"description":"Issue body content","type":"string"},"labels":{"description":"Labels to apply to this issue","items":{"type":"string"},"type":"array"},"milestone":{"description":"Milestone number","type":"number"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"},"title":{"description":"Issue title","type":"string"}},"required":["owner","repo","title"],"type":"object"}},"name":"create_issue","description":"Create a new issue in a GitHub repository."},{"inputSchema":{"json":{"properties":{"branch":{"description":"Branch to create/update the file in","type":"string"},"content":{"description":"Content of the file","type":"string"},"message":{"description":"Commit message","type":"string"},"owner":{"description":"Repository owner (username or organization)","type":"string"},"path":{"description":"Path where to create/update the file","type":"string"},"repo":{"description":"Repository name","type":"string"},"sha":{"description":"SHA of file being replaced (for updates)","type":"string"}},"required":["ow
... (truncated)
CSV: N/A
TSV: N/A
YAML
chars: 38,139 tokens: 7,927 chars_og/tok: 6.5 enc_chars/tok: 4.8
- description: Add a comment to a specific issue in a GitHub repository.↵
· inputSchema:↵
··· json:↵
····· properties:↵
······· body:↵
········· description: Comment content
········· type: string
······· issue_number:↵
········· description: Issue number to comment on
········· type: number
······· owner:↵
········· description: Repository owner
········· type: string
······· repo:↵
········· description: Repository name
········· type: string
····· required:↵
····· - owner
····· - repo
····· - issue_number
····· - body
····· type: object
· name: add_issue_comment
- description: Add a comment to the requester's latest pending pull request review,↵
··· a pending review needs to already exist to call this (check with the user if not
... (truncated)
TOON
chars: 38,376 tokens: 7,670 chars_og/tok: 6.7 enc_chars/tok: 5.0
[51]:↵
· -↵
··· inputSchema:↵
····· json:↵
······· properties:↵
········· body:↵
··········· description: Comment content
··········· type: string
········· issue_number:↵
··········· description: Issue number to comment on
··········· type: number
········· owner:↵
··········· description: Repository owner
··········· type: string
········· repo:↵
··········· description: Repository name
··········· type: string
······· required[4]: owner,repo,issue_number,body
······· type: object
··· name: add_issue_comment
··· description: Add a comment to a specific issue in a GitHub repository.↵
· -↵
··· inputSchema:↵
····· json:↵
······· properties:
... (truncated)
TSON
chars: 25,878 tokens: 5,889 chars_og/tok: 8.8 enc_chars/tok: 4.4
{@inputSchema(@json),name,description#51|{{@properties,required,type|{@body,issue_number,owner,repo|{@description,type|"Comment content",string},{@description,type|"Issue number to comment on",number},{@description,type|"Repository owner",string},{@description,type|"Repository name",string}},[owner,repo,issue_number,body],object}},add_issue_comment,"Add a comment to a specific issue in a GitHub repository."|{{@properties,required,type|{@body,line,owner,path,pullNumber,repo,side,startLine,startSide,subjectType|{@description,type|"The text of the review comment",string},{@description,type|"The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range",number},{@description,type|"Repository owner",string},{@description,type|"The relative path to the file that necessitates a comment",string},{@description,type|"Pull request number",number},{@description,type|"Repository name",string},{@description,enum,type|"The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state",[LEFT,RIGHT],string},{@description,type|"For multi-line comments, the first line of the range that the comment applies to",number},{@description,enum,type|"For multi-line comments, the starting side of the diff that the comment applies to. 
LEFT indicates the previous state, RIGHT indicates the new state",[LEFT,RIGHT],string},{@description,enum,type|"The level at which the comment is targeted",[FILE,LINE],string}},[owner,repo,pullNumber,path,body,subjectType],object}},add_pull_request_review_comment_to_pending_review,"Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure)."|{{@properties,required,type|{@issueNumber,owner,repo|{@description,type|"Issue number",number},{@description,type|"Repository owner",string},{@description,type|"Repository name",string}},[owner,repo,issueNumber],object}},assign_copilot_to_issue,"Assign Copilot to a specific issue in a GitHub repository.\n\nThis tool can help with the following outcomes:\n- a Pull Request created with source code changes to resolve the issue\n\n\nMore information can be found at:\n- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot\n"|{{@properties,required,type|{@body,commitID,event,owner,pullNumber,repo|{@description,type|"Review comment text",string},{@description,type|"SHA of commit to review",string},{@description,enum,type|"Review action to perform",[APPROVE,REQUEST_CHANGES,COMMENT],string},{@description,type|"Repository owner",string},{@description,type|"Pull request number",number},{@description,type|"Repository name",string}},[owner,repo,pullNumber,body,event],object}},create_and_submit_pull_request_review,"Create and submit a review for a pull request without review comments."|{{@properties,required,type|{@branch,from_branch,owner,repo|{@description,type|"Name for new branch",string},{@description,type|"Source branch (defaults to repo default)",string},{@description,type|"Repository owner",string},{@description,type|"Repository name",string}},[owner,repo,branch],object}},create_branch,"Create a new branch in a GitHub 
repository"|{{@properties,required,type|{@assignees,body,labels,milestone,owner,repo,title|{@description,items,type|"Usernames to assign to this issue",{@type|string},array},{@description,type|"Issue body content",string},{@description,items,type|"Labels to apply to this issue",{@type|string},array},{@description,type|"Milestone number",number},{@description,type|"Repository owner",string},{@description,type|"Repository name",string},{@description,type|"Issue title",string}},[owner,repo,title],object}},create_issue,"Create a new issue in a GitHub repository."|{{@properties,required,type|{@branch,content,message,owner,path,repo,sha|{@description,type|"Branch to create/update the file in",string},{@description,type|"Content of the file",string},{@description,type|"Commit message",string},{@description,type|"Repository owner (username or organization)",string},{@description,type|"Path where to create/update the file",string},{@description,type|"Repository name",string},{@description,type|"SHA of file being replaced (for updates)",string}},[owner,repo,path,content,message,branch],object}},create_or_update_file,"Create or update a single file in a GitHub repository. If updating, you must provide the SHA of the file you want to update."|{{@properties,required,type|{@commitID,owner,pullNumber,repo|{@description,type|"SHA of commit to review",string},{@description,type|"Repository owner",string},{@description,type|"Pull request number",number},{@description,type|"Repository name",string}},[owner,repo,pullNumber],object}},create_pending_pull_request_review,"Create a pending review for a pull request. Call this first before attempting to add comments to a pending review, and ultimately submitting it
... (truncated)
minemizer
chars: 23,383 tokens: 5,319 chars_og/tok: 9.7 enc_chars/tok: 4.4
inputSchema{ json{ properties{ owner{ description; type}; repo{ description; type}; ...}; required[]; type}}; name; description
{{ {{ Repository owner; string};{ Repository name; string}; body:{ description: Comment content; type: string}; issue_number:{ description: Issue number to comment on; type: number}};[ owner; repo; issue_number; body]; object}}; add_issue_comment; Add a comment to a specific issue in a GitHub repository.↵
{{ {{ Repository owner; string};{ Repository name; string}; body:{ description: The text of the review comment; type: string}; line:{ description: The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range; type: number}; path:{ description: The relative path to the file that necessitates a comment; type: string}; pullNumber:{ description: Pull request number; type: number}; side:{ description: The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state; enum:[ LEFT; RIGHT]; type: string}; startLine:{ description: For multi-line comments, the first line of the range that the comment applies to; type: number}; startSide:{ description: For multi-line comments, the starting side of the diff that the comment applies to. LEFT indicates the previous state, RIGHT indicates the new state; enum:[ LEFT; RIGHT]; type: string}; subjectType:{ description: The level at which the comment is targeted; enum:[ FILE; LINE]; type: string}};[ owner; repo; pullNumber; path; body; subjectType]; object}}; add_pull_request_review_comment_to_pending_review; Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure).↵
{{ {{ Repository owner; string};{ Repository name; string}; issueNumber:{ description: Issue number; type: number}};[ owner; repo; issueNumber]; object}}; assign_copilot_to_issue; Assign Copilot to a specific issue in a GitHub repository.↵↵
This tool can help with the following outcomes:↵
- a Pull Request created with source code changes to resolve the issue↵↵↵
More information can be found at:↵
- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot↵↵
{{ {{ Repository owner; string};{ Repository name; string}; body:{ description: Review comment text; type: string}; commitID:{ description: SHA of commit to review; type: string}; event:{ description: Review action to perform; enum:[ APPROVE; REQUEST_CHANGES; COMMENT]; type: string}; pullNumber:{ description: Pull request number; type: number}};[ owner; repo; pullNumber; body; event]; object}}; create_and_submit_pull_request_review; Create and submit a review for a pull request without review comments.↵
{{ {{ Repository owner; string};{ Repository name; string}; branch:{ description: Name for new branch; type: string}; from_branch:{ description: Source branch (defaults to repo default); type: string}};[ owner; repo; branch]; object}}; create_branch; Create a new branch in a GitHub repository
{{ {{ Repository owner; string};{ Repository name; string}; assignees:{ description: Usernames to assign to this issue; items:{ type: string}; type: array}; body:{ description: Issue body content; type: string}; labels:{ description: Labels to apply to this issue; items:{ type: string}; type: array}; milestone:{ description: Milestone number; type: number}; title:{ description: Issue title; type: string}};[ owner; repo; title]; object}}; create_issue; Create a new issue in a GitHub repository.↵
{{ {{ Repository owner (username or organization); string};{ Repository name; string}; branch:{ description: Branch to create/update the file in; type: string}; content:{ description: Content of the file; type: string}; message:{ description: Commit message; type: string}; path:{ description: Path where to create/update the file; type: string}; sha:{ description: SHA of file being replaced (for updates); type: string}};[ owner; repo; path; content; message; branch]; object}}; create_or_update_file; Create or update a single file in a GitHub repository. If updating, you must provide the SHA of the file you want to update.↵
{{ {{ Repository owner; string};{ Repository name; string}; commitID:{ description: SHA of commit to review; type: string}; pullNumber:{ description: Pull request number; type: number}};[ owner; repo; pullNumber]; object}}; create_pending_pull_request_review; Create a pending review for a pull request. Call this first before attempting to add comments to a pending review, and ultimately submitting it. A pending pull request review means a pull request review, it is pending because you create it first and submit it later, and the PR author will not see it until it is submitted.↵
{{ {{ Repository owner; string};{ Repository name; string}; base:{ description: Branch to merge into; type: string}; body:{ description: PR description; type: string}; draft:{ description: Create as draft PR; type: boolean}; head:{ description: Branch containing changes; type: string}; maintainer_can_modify:{ description: Allow maintainer edits; type: boolean}; title:{ description: PR title; type: string}};[ owner; repo; title; head; base]; object}}; create_pull_request; Create a new pull request in a GitHub repository.↵
{{ {;; autoInit:{ description: Initialize with README; type: boolean}; description:{ description: Repository description; type: string}; name:{ description: Repository name; type: string}; private:{ description: Whether repo should be private; type: boolean}};[ name]; object}}; create_repository; Create a new GitHub repository in your account
{{ {{ Repository owner (username or organization); string};{ Repository name; string}; branch:{ description: Branch to delete the file from; type: string}; message:{ description: Commit message; type: string}; path:{ description: Path to the file to delete; type: string}};[ owner; repo; path; message; branch]; object}}; delete_file; Delete a file from a GitHub repository
{{ {{ Repository owner; string};{ Repository name; string}; pullNumber:{ description: Pull request number; type: number}};[ owner; repo; pullNumber]; object}}; delete_pending_pull_request_review; Delete the requester's latest pending pull request review. Use this after the user decides not to submit a pending review, if you don't know if they already created one then check first.↵
{{ {;; state:{ description: The new state of the notification (read/done); enum:[ read; done]; type: string}; threadID:{ description: The ID of the notification thread; type: string}};[ threadID]; object}}; dismiss_notification; Dismiss a notification by marking it as read or done
{{ {{ Repository owner; string};{ Repository name; string}; organization:{ description: Organization to fork to; type: string}};[ owner; repo]; object}}; fork_repository; Fork a GitHub repository to your account or specified organization
{{ {{ The owner of the repository.; string};{ The name of the repository.; string}; alertNumber:{ description: The number of the alert.; type: number}};[ owner; repo; alertNumber]; object}}; get_code_scanning_alert; Get details of a specific code scanning alert in a GitHub repository.↵
{{ {{ Repository owner; string};{ Repository name; string}; page:{ description: Page number for pagination (min·1); minimum:·1; type: number}; perPage:{ description: Results per page for pagination (min·1, max·100); maximum:·100; minimum:·1; type: number}; sha:{ description: Commit SHA, branch name, or tag name; type: string}};[ owner; repo; sha]; object}}; get_commit; Get details for a commit from a GitHub repository
... (truncated)
minemizer (compact)
chars: 21,912 tokens: 5,112 chars_og/tok: 10.1 enc_chars/tok: 4.3
inputSchema{json{properties{owner{description;type};repo{description;type};...};required[];type}};name;description
{{{{Repository owner;string};{Repository name;string};body:{description:Comment content;type:string};issue_number:{description:Issue number to comment on;type:number}};[owner;repo;issue_number;body];object}};add_issue_comment;Add a comment to a specific issue in a GitHub repository.↵
{{{{Repository owner;string};{Repository name;string};body:{description:The text of the review comment;type:string};line:{description:The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range;type:number};path:{description:The relative path to the file that necessitates a comment;type:string};pullNumber:{description:Pull request number;type:number};side:{description:The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state;enum:[LEFT;RIGHT];type:string};startLine:{description:For multi-line comments, the first line of the range that the comment applies to;type:number};startSide:{description:For multi-line comments, the starting side of the diff that the comment applies to. LEFT indicates the previous state, RIGHT indicates the new state;enum:[LEFT;RIGHT];type:string};subjectType:{description:The level at which the comment is targeted;enum:[FILE;LINE];type:string}};[owner;repo;pullNumber;path;body;subjectType];object}};add_pull_request_review_comment_to_pending_review;Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure).↵
{{{{Repository owner;string};{Repository name;string};issueNumber:{description:Issue number;type:number}};[owner;repo;issueNumber];object}};assign_copilot_to_issue;Assign Copilot to a specific issue in a GitHub repository.↵↵
This tool can help with the following outcomes:↵
- a Pull Request created with source code changes to resolve the issue↵↵↵
More information can be found at:↵
- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot↵↵
{{{{Repository owner;string};{Repository name;string};body:{description:Review comment text;type:string};commitID:{description:SHA of commit to review;type:string};event:{description:Review action to perform;enum:[APPROVE;REQUEST_CHANGES;COMMENT];type:string};pullNumber:{description:Pull request number;type:number}};[owner;repo;pullNumber;body;event];object}};create_and_submit_pull_request_review;Create and submit a review for a pull request without review comments.↵
{{{{Repository owner;string};{Repository name;string};branch:{description:Name for new branch;type:string};from_branch:{description:Source branch (defaults to repo default);type:string}};[owner;repo;branch];object}};create_branch;Create a new branch in a GitHub repository
{{{{Repository owner;string};{Repository name;string};assignees:{description:Usernames to assign to this issue;items:{type:string};type:array};body:{description:Issue body content;type:string};labels:{description:Labels to apply to this issue;items:{type:string};type:array};milestone:{description:Milestone number;type:number};title:{description:Issue title;type:string}};[owner;repo;title];object}};create_issue;Create a new issue in a GitHub repository.↵
{{{{Repository owner (username or organization);string};{Repository name;string};branch:{description:Branch to create/update the file in;type:string};content:{description:Content of the file;type:string};message:{description:Commit message;type:string};path:{description:Path where to create/update the file;type:string};sha:{description:SHA of file being replaced (for updates);type:string}};[owner;repo;path;content;message;branch];object}};create_or_update_file;Create or update a single file in a GitHub repository. If updating, you must provide the SHA of the file you want to update.↵
{{{{Repository owner;string};{Repository name;string};commitID:{description:SHA of commit to review;type:string};pullNumber:{description:Pull request number;type:number}};[owner;repo;pullNumber];object}};create_pending_pull_request_review;Create a pending review for a pull request. Call this first before attempting to add comments to a pending review, and ultimately submitting it. A pending pull request review means a pull request review, it is pending because you create it first and submit it later, and the PR author will not see it until it is submitted.↵
{{{{Repository owner;string};{Repository name;string};base:{description:Branch to merge into;type:string};body:{description:PR description;type:string};draft:{description:Create as draft PR;type:boolean};head:{description:Branch containing changes;type:string};maintainer_can_modify:{description:Allow maintainer edits;type:boolean};title:{description:PR title;type:string}};[owner;repo;title;head;base];object}};create_pull_request;Create a new pull request in a GitHub repository.↵
{{{;;autoInit:{description:Initialize with README;type:boolean};description:{description:Repository description;type:string};name:{description:Repository name;type:string};private:{description:Whether repo should be private;type:boolean}};[name];object}};create_repository;Create a new GitHub repository in your account
{{{{Repository owner (username or organization);string};{Repository name;string};branch:{description:Branch to delete the file from;type:string};message:{description:Commit message;type:string};path:{description:Path to the file to delete;type:string}};[owner;repo;path;message;branch];object}};delete_file;Delete a file from a GitHub repository
{{{{Repository owner;string};{Repository name;string};pullNumber:{description:Pull request number;type:number}};[owner;repo;pullNumber];object}};delete_pending_pull_request_review;Delete the requester's latest pending pull request review. Use this after the user decides not to submit a pending review, if you don't know if they already created one then check first.↵
{{{;;state:{description:The new state of the notification (read/done);enum:[read;done];type:string};threadID:{description:The ID of the notification thread;type:string}};[threadID];object}};dismiss_notification;Dismiss a notification by marking it as read or done
{{{{Repository owner;string};{Repository name;string};organization:{description:Organization to fork to;type:string}};[owner;repo];object}};fork_repository;Fork a GitHub repository to your account or specified organization
{{{{The owner of the repository.;string};{The name of the repository.;string};alertNumber:{description:The number of the alert.;type:number}};[owner;repo;alertNumber];object}};get_code_scanning_alert;Get details of a specific code scanning alert in a GitHub repository.↵
{{{{Repository owner;string};{Repository name;string};page:{description:Page number for pagination (min·1);minimum:1;type:number};perPage:{description:Results per page for pagination (min·1, max·100);maximum:100;minimum:1;type:number};sha:{description:Commit SHA, branch name, or tag name;type:string}};[owner;repo;sha];object}};get_commit;Get details for a commit from a GitHub repository
... (truncated)
simple_flat.json — Original: 763 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)7632702.82.8
JSON (min)5221505.13.5
CSV234918.42.6
TSV234928.32.5
YAML4891724.42.8
TOON246938.22.6
TSON229868.92.7
minemizer2517510.23.3
minemizer (compact)224839.22.7
JSON (pretty)
chars: 763 tokens: 270 chars_og/tok: 2.8 enc_chars/tok: 2.8
<|begin▁of▁sentence|>[↵
· {↵
··· "id":·1,↵
··· "name": "Alice",↵
··· "role": "Engineer",↵
··· "department": "Backend"↵
· },↵
· {↵
··· "id":·2,↵
··· "name": "Bob",↵
··· "role": "Designer",↵
··· "department": "Frontend"↵
· },↵
· {↵
··· "id":·3,↵
··· "name": "Carol",↵
··· "role": "Manager",↵
··· "department": "Product"↵
· },↵
· {↵
··· "id":·4,↵
··· "name": "David",↵
··· "role": "Engineer",↵
··· "department": "Infrastructure"↵
· },
... (truncated)
JSON (min)
chars: 522 tokens: 150 chars_og/tok: 5.1 enc_chars/tok: 3.5
<|begin▁of▁sentence|>[{"id":1,"name":"Alice","role":"Engineer","department":"Backend"},{"id":2,"name":"Bob","role":"Designer","department":"Frontend"},{"id":3,"name":"Carol","role":"Manager","department":"Product"},{"id":4,"name":"David","role":"Engineer","department":"Infrastructure"},{"id":5,"name":"Eva","role":"Analyst","department":"Data"},{"id":6,"name":"Frank","role":"Engineer","department":"Backend"},{"id":7,"name":"Grace","role":"Designer","department":"Mobile"},{"id":8,"name":"Henry","role":"Manager","department":"Engineering"}]
CSV
chars: 234 tokens: 91 chars_og/tok: 8.4 enc_chars/tok: 2.6
<|begin▁of▁sentence|>id,name,role,department
1,Alice,Engineer,Backend
2,Bob,Designer,Frontend
3,Carol,Manager,Product
4,David,Engineer,Infrastructure
5,Eva,Analyst,Data
6,Frank,Engineer,Backend
7,Grace,Designer,Mobile
8,Henry,Manager,Engineering
TSV
chars: 234 tokens: 92 chars_og/tok: 8.3 enc_chars/tok: 2.5
<|begin▁of▁sentence|>id nameroledepartment
1AliceEngineerBackend
2BobDesignerFrontend
3CarolManagerProduct
4DavidEngineerInfrastructure
5EvaAnalystData
6FrankEngineerBackend
7GraceDesignerMobile
8HenryManagerEngineering
YAML
chars: 489 tokens: 172 chars_og/tok: 4.4 enc_chars/tok: 2.8
<|begin▁of▁sentence|>- department: Backend
· id:·1
· name: Alice
· role: Engineer
- department: Frontend
· id:·2
· name: Bob
· role: Designer
- department: Product
· id:·3
· name: Carol
· role: Manager
- department: Infrastructure
· id:·4
· name: David
· role: Engineer
- department: Data
· id:·5
· name: Eva
· role: Analyst
- department: Backend
· id:·6
· name: Frank
· role: Engineer
- department: Mobile
... (truncated)
TOON
chars: 246 tokens: 93 chars_og/tok: 8.2 enc_chars/tok: 2.6
<|begin▁of▁sentence|>[8]{id,name,role,department}:↵
··1,Alice,Engineer,Backend
··2,Bob,Designer,Frontend
··3,Carol,Manager,Product
··4,David,Engineer,Infrastructure
··5,Eva,Analyst,Data
··6,Frank,Engineer,Backend
··7,Grace,Designer,Mobile
··8,Henry,Manager,Engineering
TSON
chars: 229 tokens: 86 chars_og/tok: 8.9 enc_chars/tok: 2.7
<|begin▁of▁sentence|>{@id,name,role,department#8|1,Alice,Engineer,Backend|2,Bob,Designer,Frontend|3,Carol,Manager,Product|4,David,Engineer,Infrastructure|5,Eva,Analyst,Data|6,Frank,Engineer,Backend|7,Grace,Designer,Mobile|8,Henry,Manager,Engineering}
minemizer
chars: 251 tokens: 75 chars_og/tok: 10.2 enc_chars/tok: 3.3
<|begin▁of▁sentence|>id; name; role; department
1; Alice; Engineer; Backend
2; Bob; Designer; Frontend
3; Carol; Manager; Product
4; David; Engineer; Infrastructure
5; Eva; Analyst; Data
6; Frank; Engineer; Backend
7; Grace; Designer; Mobile
8; Henry; Manager; Engineering
minemizer (compact)
chars: 224 tokens: 83 chars_og/tok: 9.2 enc_chars/tok: 2.7
<|begin▁of▁sentence|>id;name;role;department
1;Alice;Engineer;Backend
2;Bob;Designer;Frontend
3;Carol;Manager;Product
4;David;Engineer;Infrastructure
5;Eva;Analyst;Data
6;Frank;Engineer;Backend
7;Grace;Designer;Mobile
8;Henry;Manager;Engineering
nested_objects.json — Original: 1039 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)1,0393493.03.0
JSON (min)6181875.63.3
CSVN/A
TSVN/A
YAML6292284.62.8
TOON6752244.63.0
TSON3061248.42.5
minemizer3251208.72.7
minemizer (compact)2901198.72.4
JSON (pretty)
chars: 1,039 tokens: 349 chars_og/tok: 3.0 enc_chars/tok: 3.0
<|begin▁of▁sentence|>[↵
· {↵
··· "id": "u1",↵
··· "name": "Lukas",↵
··· "location": {↵
····· "office": "Kaunas HQ",↵
····· "floor":·12
··· },↵
··· "skills": [↵
····· "python",↵
····· "kubernetes"↵
··· ]↵
· },↵
· {↵
··· "id": "u2",↵
··· "name": "Emma",↵
··· "location": {↵
····· "office": "Boston Hub",↵
····· "floor":·7
··· },↵
··· "skills": [↵
····· "react",↵
····· "typescript",↵
····· "graphql"↵
··· ]
... (truncated)
JSON (min)
chars: 618 tokens: 187 chars_og/tok: 5.6 enc_chars/tok: 3.3
<|begin▁of▁sentence|>[{"id":"u1","name":"Lukas","location":{"office":"Kaunas HQ","floor":12},"skills":["python","kubernetes"]},{"id":"u2","name":"Emma","location":{"office":"Boston Hub","floor":7},"skills":["react","typescript","graphql"]},{"id":"u3","name":"Pierre","location":{"office":"Paris Office","floor":3},"skills":["rust"]},{"id":"u4","name":"Hana","location":{"office":"Tokyo Tower","floor":15},"skills":["go","docker"]},{"id":"u5","name":"Wei","location":{"office":"Taipei Center","floor":8},"skills":["java","spring"]},{"id":"u6","name":"Charlotte","location":{"office":"London Bridge","floor":5},"skills":["python","django"]}]
CSV: N/A
TSV: N/A
YAML
chars: 629 tokens: 228 chars_og/tok: 4.6 enc_chars/tok: 2.8
<|begin▁of▁sentence|>- id: u1
· location:↵
··· floor:·12
··· office: Kaunas HQ
· name: Lukas
· skills:↵
· - python
· - kubernetes
- id: u2
· location:↵
··· floor:·7
··· office: Boston Hub
· name: Emma
· skills:↵
· - react
· - typescript
· - graphql
- id: u3
· location:↵
··· floor:·3
··· office: Paris Office
· name: Pierre
· skills:↵
· - rust
- id: u4
... (truncated)
TOON
chars: 675 tokens: 224 chars_og/tok: 4.6 enc_chars/tok: 3.0
<|begin▁of▁sentence|>[6]:↵
· - id: u1
··· name: Lukas
··· location:↵
····· office: Kaunas HQ
····· floor:·12
··· skills[2]: python,kubernetes
· - id: u2
··· name: Emma
··· location:↵
····· office: Boston Hub
····· floor:·7
··· skills[3]: react,typescript,graphql
· - id: u3
··· name: Pierre
··· location:↵
····· office: Paris Office
····· floor:·3
··· skills[1]: rust
· - id: u4
··· name: Hana
··· location:↵
····· office: Tokyo Tower
····· floor:·15
··· skills[2]: go,docker
... (truncated)
TSON
chars: 306 tokens: 124 chars_og/tok: 8.4 enc_chars/tok: 2.5
<|begin▁of▁sentence|>{@id,name,location(@office,floor),skills#6|u1,Lukas,{"Kaunas HQ",12},[python,kubernetes]|u2,Emma,{"Boston Hub",7},[react,typescript,graphql]|u3,Pierre,{"Paris Office",3},[rust]|u4,Hana,{"Tokyo Tower",15},[go,docker]|u5,Wei,{"Taipei Center",8},[java,spring]|u6,Charlotte,{"London Bridge",5},[python,django]}
minemizer
chars: 325 tokens: 120 chars_og/tok: 8.7 enc_chars/tok: 2.7
<|begin▁of▁sentence|>id; name; location{ office; floor}; skills[]↵
u1; Lukas;{ Kaunas HQ;·12};[ python; kubernetes]↵
u2; Emma;{ Boston Hub;·7};[ react; typescript; graphql]↵
u3; Pierre;{ Paris Office;·3};[ rust]↵
u4; Hana;{ Tokyo Tower;·15};[ go; docker]↵
u5; Wei;{ Taipei Center;·8};[ java; spring]↵
u6; Charlotte;{ London Bridge;·5};[ python; django]
minemizer (compact)
chars: 290 tokens: 119 chars_og/tok: 8.7 enc_chars/tok: 2.4
<|begin▁of▁sentence|>id;name;location{office;floor};skills[]↵
u1;Lukas;{Kaunas HQ;12};[python;kubernetes]↵
u2;Emma;{Boston Hub;7};[react;typescript;graphql]↵
u3;Pierre;{Paris Office;3};[rust]↵
u4;Hana;{Tokyo Tower;15};[go;docker]↵
u5;Wei;{Taipei Center;8};[java;spring]↵
u6;Charlotte;{London Bridge;5};[python;django]
lists_of_primitives.json — Original: 610 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)6102232.72.7
JSON (min)3301155.32.9
CSVN/A
TSVN/A
YAML3411524.02.2
TOON3391424.32.4
TSON168787.82.2
minemizer188689.02.8
minemizer (compact)165718.62.3
JSON (pretty)
chars: 610 tokens: 223 chars_og/tok: 2.7 enc_chars/tok: 2.7
<|begin▁of▁sentence|>[↵
· {↵
··· "id":·1,↵
··· "name": "Alice",↵
··· "skills": [↵
····· "python",↵
····· "go",↵
····· "rust"↵
··· ]↵
· },↵
· {↵
··· "id":·2,↵
··· "name": "Bob",↵
··· "skills": [↵
····· "javascript",↵
····· "typescript"↵
··· ]↵
· },↵
· {↵
··· "id":·3,↵
··· "name": "Carol",↵
··· "skills": [↵
····· "java",↵
····· "kotlin",↵
····· "scala",
... (truncated)
JSON (min)
chars: 330 tokens: 115 chars_og/tok: 5.3 enc_chars/tok: 2.9
<|begin▁of▁sentence|>[{"id":1,"name":"Alice","skills":["python","go","rust"]},{"id":2,"name":"Bob","skills":["javascript","typescript"]},{"id":3,"name":"Carol","skills":["java","kotlin","scala","groovy"]},{"id":4,"name":"David","skills":["c","cpp"]},{"id":5,"name":"Eva","skills":["ruby","elixir","erlang"]},{"id":6,"name":"Frank","skills":["swift"]}]
CSV: N/A
TSV: N/A
YAML
chars: 341 tokens: 152 chars_og/tok: 4.0 enc_chars/tok: 2.2
<|begin▁of▁sentence|>- id:·1
· name: Alice
· skills:↵
· - python
· - go
· - rust
- id:·2
· name: Bob
· skills:↵
· - javascript
· - typescript
- id:·3
· name: Carol
· skills:↵
· - java
· - kotlin
· - scala
· - groovy
- id:·4
· name: David
· skills:↵
· - c
· - cpp
- id:·5
· name: Eva
... (truncated)
TOON
chars: 339 tokens: 142 chars_og/tok: 4.3 enc_chars/tok: 2.4
<|begin▁of▁sentence|>[6]:↵
· - id:·1
··· name: Alice
··· skills[3]: python,go,rust
· - id:·2
··· name: Bob
··· skills[2]: javascript,typescript
· - id:·3
··· name: Carol
··· skills[4]: java,kotlin,scala,groovy
· - id:·4
··· name: David
··· skills[2]: c,cpp
· - id:·5
··· name: Eva
··· skills[3]: ruby,elixir,erlang
· - id:·6
··· name: Frank
··· skills[1]: swift
TSON
chars: 168 tokens: 78 chars_og/tok: 7.8 enc_chars/tok: 2.2
<|begin▁of▁sentence|>{@id,name,skills#6|1,Alice,[python,go,rust]|2,Bob,[javascript,typescript]|3,Carol,[java,kotlin,scala,groovy]|4,David,[c,cpp]|5,Eva,[ruby,elixir,erlang]|6,Frank,[swift]}
minemizer
chars: 188 tokens: 68 chars_og/tok: 9.0 enc_chars/tok: 2.8
<|begin▁of▁sentence|>id; name; skills[]↵
1; Alice;[ python; go; rust]↵
2; Bob;[ javascript; typescript]↵
3; Carol;[ java; kotlin; scala; groovy]↵
4; David;[ c; cpp]↵
5; Eva;[ ruby; elixir; erlang]↵
6; Frank;[ swift]
minemizer (compact)
chars: 165 tokens: 71 chars_og/tok: 8.6 enc_chars/tok: 2.3
<|begin▁of▁sentence|>id;name;skills[]↵
1;Alice;[python;go;rust]↵
2;Bob;[javascript;typescript]↵
3;Carol;[java;kotlin;scala;groovy]↵
4;David;[c;cpp]↵
5;Eva;[ruby;elixir;erlang]↵
6;Frank;[swift]
sparse_data.json — Original: 611 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)6112292.72.7
JSON (min)4001264.83.2
CSVN/A
TSVN/A
YAML3841504.12.6
TOON4381603.82.7
TSON3281175.22.8
minemizer200738.42.7
minemizer (compact)180768.02.4
JSON (pretty)
chars: 611 tokens: 229 chars_og/tok: 2.7 enc_chars/tok: 2.7
<|begin▁of▁sentence|>[↵
· {↵
··· "id":·1,↵
··· "name": "Erik",↵
··· "department": "Engineering"↵
· },↵
· {↵
··· "id":·2,↵
··· "name": "Rachel",↵
··· "department": "Design",↵
··· "remote": true
· },↵
· {↵
··· "id":·3,↵
··· "name": "Hans"↵
· },↵
· {↵
··· "id":·4,↵
··· "name": "Kenji",↵
··· "department": "Sales",↵
··· "slack": "@kenji",↵
··· "remote": false
· },↵
· {↵
··· "id":·5,
... (truncated)
JSON (min)
chars: 400 tokens: 126 chars_og/tok: 4.8 enc_chars/tok: 3.2
<|begin▁of▁sentence|>[{"id":1,"name":"Erik","department":"Engineering"},{"id":2,"name":"Rachel","department":"Design","remote":true},{"id":3,"name":"Hans"},{"id":4,"name":"Kenji","department":"Sales","slack":"@kenji","remote":false},{"id":5,"name":"Mai","remote":true},{"id":6,"name":"Tom","department":"Engineering"},{"id":7,"name":"Priya","slack":"@priya","remote":true},{"id":8,"name":"Nina","department":"Marketing"}]
CSV: N/A
TSV: N/A
YAML
chars: 384 tokens: 150 chars_og/tok: 4.1 enc_chars/tok: 2.6
<|begin▁of▁sentence|>- department: Engineering
· id:·1
· name: Erik
- department: Design
· id:·2
· name: Rachel
· remote: true
- id:·3
· name: Hans
- department: Sales
· id:·4
· name: Kenji
· remote: false
· slack: '@kenji'↵
- id:·5
· name: Mai
· remote: true
- department: Engineering
· id:·6
· name: Tom
- id:·7
· name: Priya
· remote: true
· slack: '@priya'↵
- department: Marketing
... (truncated)
TOON
chars: 438 tokens: 160 chars_og/tok: 3.8 enc_chars/tok: 2.7
<|begin▁of▁sentence|>[8]:↵
· - id:·1
··· name: Erik
··· department: Engineering
· - id:·2
··· name: Rachel
··· department: Design
··· remote: true
· - id:·3
··· name: Hans
· - id:·4
··· name: Kenji
··· department: Sales
··· slack: @kenji
··· remote: false
· - id:·5
··· name: Mai
··· remote: true
· - id:·6
··· name: Tom
··· department: Engineering
· - id:·7
··· name: Priya
··· slack: @priya
··· remote: true
... (truncated)
TSON
chars: 328 tokens: 117 chars_og/tok: 5.2 enc_chars/tok: 2.8
<|begin▁of▁sentence|>[{@id,name,department|1,Erik,Engineering},{@id,name,department,remote|2,Rachel,Design,true},{@id,name|3,Hans},{@id,name,department,slack,remote|4,Kenji,Sales,"@kenji",false},{@id,name,remote|5,Mai,true},{@id,name,department|6,Tom,Engineering},{@id,name,slack,remote|7,Priya,"@priya",true},{@id,name,department|8,Nina,Marketing}]
minemizer
chars: 200 tokens: 73 chars_og/tok: 8.4 enc_chars/tok: 2.7
<|begin▁of▁sentence|>id; name; department; remote
1; Erik; Engineering
2; Rachel; Design;true
3; Hans
4; Kenji; Sales;false; slack: @kenji
5; Mai;;true
6; Tom; Engineering
7; Priya;;true; slack: @priya
8; Nina; Marketing;
minemizer (compact)
chars: 180 tokens: 76 chars_og/tok: 8.0 enc_chars/tok: 2.4
<|begin▁of▁sentence|>id;name;department;remote
1;Erik;Engineering
2;Rachel;Design;true
3;Hans
4;Kenji;Sales;false;slack:@kenji
5;Mai;;true
6;Tom;Engineering
7;Priya;;true;slack:@priya
8;Nina;Marketing;
complex_mixed.json — Original: 1320 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)1,3204283.13.1
JSON (min)7602395.53.2
CSVN/A
TSVN/A
YAML8182794.72.9
TOON8812794.73.2
TSON4531946.82.3
minemizer4031618.22.5
minemizer (compact)3611598.32.3
JSON (pretty)
chars: 1,320 tokens: 428 chars_og/tok: 3.1 enc_chars/tok: 3.1
<|begin▁of▁sentence|>[↵
· {↵
··· "id":·1,↵
··· "profile": {↵
····· "name": "Grace",↵
····· "location": {↵
······· "city": "NYC",↵
······· "country": "USA"↵
····· }↵
··· },↵
··· "tags": [↵
····· "admin",↵
····· "verified"↵
··· ],↵
··· "metadata": {↵
····· "created": "2024-01-15"↵
··· }↵
· },↵
· {↵
··· "id":·2,↵
··· "profile": {↵
····· "name": "Henry",↵
····· "location": {↵
······· "city": "London",↵
······· "country": "UK"
... (truncated)
JSON (min)
chars: 760 tokens: 239 chars_og/tok: 5.5 enc_chars/tok: 3.2
<|begin▁of▁sentence|>[{"id":1,"profile":{"name":"Grace","location":{"city":"NYC","country":"USA"}},"tags":["admin","verified"],"metadata":{"created":"2024-01-15"}},{"id":2,"profile":{"name":"Henry","location":{"city":"London","country":"UK"}},"tags":["user"],"metadata":{"created":"2024-02-20","updated":"2024-03-10"}},{"id":3,"profile":{"name":"Ivy","location":{"city":"Tokyo","country":"Japan"}},"tags":["moderator","verified","premium"],"metadata":{"created":"2024-01-05"}},{"id":4,"profile":{"name":"Jack","location":{"city":"Sydney","country":"Australia"}},"tags":["user","new"],"metadata":{"created":"2024-04-01"}},{"id":5,"profile":{"name":"Kate","location":{"city":"Berlin","country":"Germany"}},"tags":["admin"],"metadata":{"created":"2023-12-01","updated":"2024-02-15"}}]
CSV: N/A
TSV: N/A
YAML
chars: 818 tokens: 279 chars_og/tok: 4.7 enc_chars/tok: 2.9
<|begin▁of▁sentence|>- id:·1
· metadata:↵
··· created: '2024-01-15'↵
· profile:↵
··· location:↵
····· city: NYC
····· country: USA
··· name: Grace
· tags:↵
· - admin
· - verified
- id:·2
· metadata:↵
··· created: '2024-02-20'↵
··· updated: '2024-03-10'↵
· profile:↵
··· location:↵
····· city: London
····· country: UK
··· name: Henry
· tags:↵
· - user
- id:·3
· metadata:↵
··· created: '2024-01-05'
... (truncated)
TOON
chars: 881 tokens: 279 chars_og/tok: 4.7 enc_chars/tok: 3.2
<|begin▁of▁sentence|>[5]:↵
· - id:·1
··· profile:↵
····· name: Grace
····· location:↵
······· city: NYC
······· country: USA
··· tags[2]: admin,verified
··· metadata:↵
····· created:·2024-01-15
· - id:·2
··· profile:↵
····· name: Henry
····· location:↵
······· city: London
······· country: UK
··· tags[1]: user
··· metadata:↵
····· created:·2024-02-20
····· updated:·2024-03-10
· - id:·3
··· profile:↵
····· name: Ivy
····· location:↵
······· city: Tokyo
... (truncated)
TSON
chars: 453 tokens: 194 chars_og/tok: 6.8 enc_chars/tok: 2.3
<|begin▁of▁sentence|>{@id,profile(@name,location),tags,metadata#5|1,{Grace,{@city,country|NYC,USA}},[admin,verified],{@created|2024-01-15}|2,{Henry,{@city,country|London,UK}},[user],{@created,updated|2024-02-20,2024-03-10}|3,{Ivy,{@city,country|Tokyo,Japan}},[moderator,verified,premium],{@created|2024-01-05}|4,{Jack,{@city,country|Sydney,Australia}},[user,new],{@created|2024-04-01}|5,{Kate,{@city,country|Berlin,Germany}},[admin],{@created,updated|2023-12-01,2024-02-15}}
minemizer
chars: 403 tokens: 161 chars_og/tok: 8.2 enc_chars/tok: 2.5
<|begin▁of▁sentence|>id; profile{ name; location{ city; country}}; tags[]; metadata{ created; ...}↵
1;{ Grace;{ NYC; USA}};[ admin; verified];{·2024-01-15}↵
2;{ Henry;{ London; UK}};[ user];{·2024-02-20; updated:·2024-03-10}↵
3;{ Ivy;{ Tokyo; Japan}};[ moderator; verified; premium];{·2024-01-05}↵
4;{ Jack;{ Sydney; Australia}};[ user; new];{·2024-04-01}↵
5;{ Kate;{ Berlin; Germany}};[ admin];{·2023-12-01; updated:·2024-02-15}
minemizer (compact)
chars: 361 tokens: 159 chars_og/tok: 8.3 enc_chars/tok: 2.3
<|begin▁of▁sentence|>id;profile{name;location{city;country}};tags[];metadata{created;...}↵
1;{Grace;{NYC;USA}};[admin;verified];{2024-01-15}↵
2;{Henry;{London;UK}};[user];{2024-02-20;updated:2024-03-10}↵
3;{Ivy;{Tokyo;Japan}};[moderator;verified;premium];{2024-01-05}↵
4;{Jack;{Sydney;Australia}};[user;new];{2024-04-01}↵
5;{Kate;{Berlin;Germany}};[admin];{2023-12-01;updated:2024-02-15}
books.json — Original: 27902 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)27,9028,9553.13.1
JSON (min)22,5016,1664.53.6
CSV14,0714,4636.33.2
TSV14,0574,6806.03.0
YAML22,4007,1593.93.1
TOON14,2774,4356.33.2
TSON14,4484,4846.23.2
minemizer14,4584,5206.23.2
minemizer (compact)13,7534,3876.43.1
JSON (pretty)
chars: 27,902 tokens: 8,955 chars_og/tok: 3.1 enc_chars/tok: 3.1
<|begin▁of▁sentence|>[↵
· {↵
··· "author": "Chinua Achebe",↵
··· "country": "Nigeria",↵
··· "imageLink": "images/things-fall-apart.jpg",↵
··· "language": "English",↵
··· "link": "https://en.wikipedia.org/wiki/Things_Fall_Apart\n",↵
··· "pages":·209,↵
··· "title": "Things Fall Apart",↵
··· "year":·1958
· },↵
· {↵
··· "author": "Hans Christian Andersen",↵
··· "country": "Denmark",↵
··· "imageLink": "images/fairy-tales.jpg",↵
··· "language": "Danish",↵
··· "link": "https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",↵
··· "pages":·784,↵
··· "title": "Fairy tales",↵
··· "year":·1836
· },↵
· {↵
··· "author": "Dante Alighieri",↵
··· "country": "Italy",↵
··· "imageLink": "images/the-divine-comedy.jpg",
... (truncated)
JSON (min)
chars: 22,501 tokens: 6,166 chars_og/tok: 4.5 enc_chars/tok: 3.6
<|begin▁of▁sentence|>[{"author":"Chinua Achebe","country":"Nigeria","imageLink":"images/things-fall-apart.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Things_Fall_Apart\n","pages":209,"title":"Things Fall Apart","year":1958},{"author":"Hans Christian Andersen","country":"Denmark","imageLink":"images/fairy-tales.jpg","language":"Danish","link":"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n","pages":784,"title":"Fairy tales","year":1836},{"author":"Dante Alighieri","country":"Italy","imageLink":"images/the-divine-comedy.jpg","language":"Italian","link":"https://en.wikipedia.org/wiki/Divine_Comedy\n","pages":928,"title":"The Divine Comedy","year":1315},{"author":"Unknown","country":"Sumer and Akkadian Empire","imageLink":"images/the-epic-of-gilgamesh.jpg","language":"Akkadian","link":"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n","pages":160,"title":"The Epic Of Gilgamesh","year":-1700},{"author":"Unknown","country":"Achaemenid Empire","imageLink":"images/the-book-of-job.jpg","language":"Hebrew","link":"https://en.wikipedia.org/wiki/Book_of_Job\n","pages":176,"title":"The Book Of Job","year":-600},{"author":"Unknown","country":"India/Iran/Iraq/Egypt/Tajikistan","imageLink":"images/one-thousand-and-one-nights.jpg","language":"Arabic","link":"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n","pages":288,"title":"One Thousand and One Nights","year":1200},{"author":"Unknown","country":"Iceland","imageLink":"images/njals-saga.jpg","language":"Old Norse","link":"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n","pages":384,"title":"Nj\u00e1l's Saga","year":1350},{"author":"Jane Austen","country":"United Kingdom","imageLink":"images/pride-and-prejudice.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n","pages":226,"title":"Pride and Prejudice","year":1813},{"author":"Honor\u00e9 de 
Balzac","country":"France","imageLink":"images/le-pere-goriot.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n","pages":443,"title":"Le P\u00e8re Goriot","year":1835},{"author":"Samuel Beckett","country":"Republic of Ireland","imageLink":"images/molloy-malone-dies-the-unnamable.jpg","language":"French, English","link":"https://en.wikipedia.org/wiki/Molloy_(novel)\n","pages":256,"title":"Molloy, Malone Dies, The Unnamable, the trilogy","year":1952},{"author":"Giovanni Boccaccio","country":"Italy","imageLink":"images/the-decameron.jpg","language":"Italian","link":"https://en.wikipedia.org/wiki/The_Decameron\n","pages":1024,"title":"The Decameron","year":1351},{"author":"Jorge Luis Borges","country":"Argentina","imageLink":"images/ficciones.jpg","language":"Spanish","link":"https://en.wikipedia.org/wiki/Ficciones\n","pages":224,"title":"Ficciones","year":1965},{"author":"Emily Bront\u00eb","country":"United Kingdom","imageLink":"images/wuthering-heights.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Wuthering_Heights\n","pages":342,"title":"Wuthering Heights","year":1847},{"author":"Albert Camus","country":"Algeria, French Empire","imageLink":"images/l-etranger.jpg","language":"French","link":"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n","pages":185,"title":"The Stranger","year":1942},{"author":"Paul Celan","country":"Romania, France","imageLink":"images/poems-paul-celan.jpg","language":"German","link":"\n","pages":320,"title":"Poems","year":1952},{"author":"Louis-Ferdinand C\u00e9line","country":"France","imageLink":"images/voyage-au-bout-de-la-nuit.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n","pages":505,"title":"Journey to the End of the Night","year":1932},{"author":"Miguel de 
Cervantes","country":"Spain","imageLink":"images/don-quijote-de-la-mancha.jpg","language":"Spanish","link":"https://en.wikipedia.org/wiki/Don_Quixote\n","pages":1056,"title":"Don Quijote De La Mancha","year":1610},{"author":"Geoffrey Chaucer","country":"England","imageLink":"images/the-canterbury-tales.jpg","language":"English","link":"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n","pages":544,"title":"The Canterbury Tales","year":1450},{"author":"Anton Chekhov","country":"Russia","imageLink":"images/stories-of-anton-chekhov.jpg","language":"Russian","link":"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n","pages":194,"title":"Stories","year":1886},{"author":"Joseph Conrad","country":"United Kingdom","imageLink":"images/nostromo.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Nostromo\n","pages":320,"title":"Nostromo","year":1904},{"author":"Charles Dickens","country":"United Kingdom","imageLink":"images/great-expectations.jpg","language":"English","link":"https://en.wikipedia.org/wiki/Great_Expectations\n","pages":194,"title":"Great Expectations","year":1861},{"author":"Denis Diderot","country":"France","imageLink":"images/jacques-the-fatalist.jpg","language":"French","link":"https://en.wikipedia.org/wiki/Jacques_the_Fatalis
... (truncated)
CSV
chars: 14,071 tokens: 4,463 chars_og/tok: 6.3 enc_chars/tok: 3.2
<|begin▁of▁sentence|>author,country,imageLink,language,link,pages,title,year
Chinua Achebe,Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart
",209,Things Fall Apart,1958
Hans Christian Andersen,Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵
",784,Fairy tales,1836
Dante Alighieri,Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy
",928,The Divine Comedy,1315
Unknown,Sumer and Akkadian Empire,images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
",160,The Epic Of Gilgamesh,-1700
Unknown,Achaemenid Empire,images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job
",176,The Book Of Job,-600
Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
",288,One Thousand and One Nights,1200
Unknown,Iceland,images/njals-saga.jpg,Old Norse,"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
",384,Njál's Saga,1350
Jane Austen,United Kingdom,images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice
",226,Pride and Prejudice,1813
Honoré de Balzac,France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
",443,Le Père Goriot,1835
Samuel Beckett,Republic of Ireland,images/molloy-malone-dies-the-unnamable.jpg,"French, English","https://en.wikipedia.org/wiki/Molloy_(novel)↵
",256,"Molloy, Malone Dies, The Unnamable, the trilogy",1952
Giovanni Boccaccio,Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron
",1024,The Decameron,1351
Jorge Luis Borges,Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones
",224,Ficciones,1965
... (truncated)
TSV
chars: 14,057 tokens: 4,680 chars_og/tok: 6.0 enc_chars/tok: 3.0
<|begin▁of▁sentence|>authorcountryimageLinklanguagelink pagestitleyear
Chinua AchebeNigeriaimages/things-fall-apart.jpgEnglish"https://en.wikipedia.org/wiki/Things_Fall_Apart
"209Things Fall Apart1958
Hans Christian AndersenDenmarkimages/fairy-tales.jpgDanish"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵
"784Fairy tales1836
Dante AlighieriItalyimages/the-divine-comedy.jpgItalian"https://en.wikipedia.org/wiki/Divine_Comedy
"928The Divine Comedy1315
Unknown Sumer and Akkadian Empireimages/the-epic-of-gilgamesh.jpg Akkadian"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
"160The Epic Of Gilgamesh-1700
Unknown Achaemenid Empireimages/the-book-of-job.jpgHebrew"https://en.wikipedia.org/wiki/Book_of_Job
"176The Book Of Job-600
UnknownIndia/Iran/Iraq/Egypt/Tajikistanimages/one-thousand-and-one-nights.jpgArabic"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
"288One Thousand and One Nights1200
UnknownIcelandimages/njals-saga.jpgOld Norse"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
"384Njál's Saga1350
Jane AustenUnited Kingdomimages/pride-and-prejudice.jpgEnglish"https://en.wikipedia.org/wiki/Pride_and_Prejudice
"226Pride and Prejudice1813
Honoré de BalzacFranceimages/le-pere-goriot.jpgFrench"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
"443Le Père Goriot1835
Samuel BeckettRepublic of Irelandimages/molloy-malone-dies-the-unnamable.jpgFrench, English"https://en.wikipedia.org/wiki/Molloy_(novel)↵
"256Molloy, Malone Dies, The Unnamable, the trilogy1952
Giovanni BoccaccioItalyimages/the-decameron.jpgItalian"https://en.wikipedia.org/wiki/The_Decameron
"1024The Decameron1351
Jorge Luis BorgesArgentinaimages/ficciones.jpgSpanish"https://en.wikipedia.org/wiki/Ficciones
"224Ficciones1965
... (truncated)
YAML
chars: 22,400 tokens: 7,159 chars_og/tok: 3.9 enc_chars/tok: 3.1
<|begin▁of▁sentence|>- author: Chinua Achebe
· country: Nigeria
· imageLink: images/things-fall-apart.jpg
· language: English
· link: 'https://en.wikipedia.org/wiki/Things_Fall_Apart↵↵
··· '↵
· pages:·209
· title: Things Fall Apart
· year:·1958
- author: Hans Christian Andersen
· country: Denmark
· imageLink: images/fairy-tales.jpg
· language: Danish
· link: 'https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵↵
··· '↵
· pages:·784
· title: Fairy tales
· year:·1836
- author: Dante Alighieri
· country: Italy
· imageLink: images/the-divine-comedy.jpg
· language: Italian
· link: 'https://en.wikipedia.org/wiki/Divine_Comedy
... (truncated)
TOON
chars: 14,277 tokens: 4,435 chars_og/tok: 6.3 enc_chars/tok: 3.2
<|begin▁of▁sentence|>[100]{author,country,imageLink,language,link,pages,title,year}:↵
· Chinua Achebe,Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart\n",209,Things Fall Apart,1958
· Hans Christian Andersen,Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",784,Fairy tales,1836
· Dante Alighieri,Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy\n",928,The Divine Comedy,1315
· Unknown,Sumer and Akkadian Empire,images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n",160,The Epic Of Gilgamesh,-1700
· Unknown,Achaemenid Empire,images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job\n",176,The Book Of Job,-600
· Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n",288,One Thousand and One Nights,1200
· Unknown,Iceland,images/njals-saga.jpg,Old Norse,"https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n",384,Njál's Saga,1350
· Jane Austen,United Kingdom,images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n",226,Pride and Prejudice,1813
· Honoré de Balzac,France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n",443,Le Père Goriot,1835
· Samuel Beckett,Republic of Ireland,images/molloy-malone-dies-the-unnamable.jpg,"French, English","https://en.wikipedia.org/wiki/Molloy_(novel)\n",256,"Molloy, Malone Dies, The Unnamable, the trilogy",1952
· Giovanni Boccaccio,Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron\n",1024,The Decameron,1351
· Jorge Luis Borges,Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones\n",224,Ficciones,1965
· Emily Brontë,United Kingdom,images/wuthering-heights.jpg,English,"https://en.wikipedia.org/wiki/Wuthering_Heights\n",342,Wuthering Heights,1847
· Albert Camus,"Algeria, French Empire",images/l-etranger.jpg,French,"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n",185,The Stranger,1942
· Paul Celan,"Romania, France",images/poems-paul-celan.jpg,German,"\n",320,Poems,1952
· Louis-Ferdinand Céline,France,images/voyage-au-bout-de-la-nuit.jpg,French,"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n",505,Journey to the End of the Night,1932
· Miguel de Cervantes,Spain,images/don-quijote-de-la-mancha.jpg,Spanish,"https://en.wikipedia.org/wiki/Don_Quixote\n",1056,Don Quijote De La Mancha,1610
· Geoffrey Chaucer,England,images/the-canterbury-tales.jpg,English,"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n",544,The Canterbury Tales,1450
· Anton Chekhov,Russia,images/stories-of-anton-chekhov.jpg,Russian,"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n",194,Stories,1886
· Joseph Conrad,United Kingdom,images/nostromo.jpg,English,"https://en.wikipedia.org/wiki/Nostromo\n",320,Nostromo,1904
· Charles Dickens,United Kingdom,images/great-expectations.jpg,English,"https://en.wikipedia.org/wiki/Great_Expectations\n",194,Great Expectations,1861
· Denis Diderot,France,images/jacques-the-fatalist.jpg,French,"https://en.wikipedia.org/wiki/Jacques_the_Fatalist\n",596,Jacques the Fatalist,1796
· Alfred Döblin,Germany,images/berlin-alexanderplatz.jpg,German,"https://en.wikipedia.org/wiki/Berlin_Alexanderplatz\n",600,Berlin Alexanderplatz,1929
· Fyodor Dostoevsky,Russia,images/crime-and-punishment.jpg,Russian,"https://en.wikipedia.org/wiki/Crime_and_Punishment\n",551,Crime and Punishment,1866
... (truncated)
TSON
chars: 14,448 tokens: 4,484 chars_og/tok: 6.2 enc_chars/tok: 3.2
<|begin▁of▁sentence|>{@author,country,imageLink,language,link,pages,title,year#100|"Chinua Achebe",Nigeria,images/things-fall-apart.jpg,English,"https://en.wikipedia.org/wiki/Things_Fall_Apart\n",209,"Things Fall Apart",1958|"Hans Christian Andersen",Denmark,images/fairy-tales.jpg,Danish,"https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.\n",784,"Fairy tales",1836|"Dante Alighieri",Italy,images/the-divine-comedy.jpg,Italian,"https://en.wikipedia.org/wiki/Divine_Comedy\n",928,"The Divine Comedy",1315|Unknown,"Sumer and Akkadian Empire",images/the-epic-of-gilgamesh.jpg,Akkadian,"https://en.wikipedia.org/wiki/Epic_of_Gilgamesh\n",160,"The Epic Of Gilgamesh",-1700|Unknown,"Achaemenid Empire",images/the-book-of-job.jpg,Hebrew,"https://en.wikipedia.org/wiki/Book_of_Job\n",176,"The Book Of Job",-600|Unknown,India/Iran/Iraq/Egypt/Tajikistan,images/one-thousand-and-one-nights.jpg,Arabic,"https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights\n",288,"One Thousand and One Nights",1200|Unknown,Iceland,images/njals-saga.jpg,"Old Norse","https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga\n",384,"Njál's Saga",1350|"Jane Austen","United Kingdom",images/pride-and-prejudice.jpg,English,"https://en.wikipedia.org/wiki/Pride_and_Prejudice\n",226,"Pride and Prejudice",1813|"Honoré de Balzac",France,images/le-pere-goriot.jpg,French,"https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot\n",443,"Le Père Goriot",1835|"Samuel Beckett","Republic of Ireland",images/molloy-malone-dies-the-unnamable.jpg,"French, English","https://en.wikipedia.org/wiki/Molloy_(novel)\n",256,"Molloy, Malone Dies, The Unnamable, the trilogy",1952|"Giovanni Boccaccio",Italy,images/the-decameron.jpg,Italian,"https://en.wikipedia.org/wiki/The_Decameron\n",1024,"The Decameron",1351|"Jorge Luis Borges",Argentina,images/ficciones.jpg,Spanish,"https://en.wikipedia.org/wiki/Ficciones\n",224,Ficciones,1965|"Emily Brontë","United 
Kingdom",images/wuthering-heights.jpg,English,"https://en.wikipedia.org/wiki/Wuthering_Heights\n",342,"Wuthering Heights",1847|"Albert Camus","Algeria, French Empire",images/l-etranger.jpg,French,"https://en.wikipedia.org/wiki/The_Stranger_(novel)\n",185,"The Stranger",1942|"Paul Celan","Romania, France",images/poems-paul-celan.jpg,German,"\n",320,Poems,1952|"Louis-Ferdinand Céline",France,images/voyage-au-bout-de-la-nuit.jpg,French,"https://en.wikipedia.org/wiki/Journey_to_the_End_of_the_Night\n",505,"Journey to the End of the Night",1932|"Miguel de Cervantes",Spain,images/don-quijote-de-la-mancha.jpg,Spanish,"https://en.wikipedia.org/wiki/Don_Quixote\n",1056,"Don Quijote De La Mancha",1610|"Geoffrey Chaucer",England,images/the-canterbury-tales.jpg,English,"https://en.wikipedia.org/wiki/The_Canterbury_Tales\n",544,"The Canterbury Tales",1450|"Anton Chekhov",Russia,images/stories-of-anton-chekhov.jpg,Russian,"https://en.wikipedia.org/wiki/List_of_short_stories_by_Anton_Chekhov\n",194,Stories,1886|"Joseph Conrad","United Kingdom",images/nostromo.jpg,English,"https://en.wikipedia.org/wiki/Nostromo\n",320,Nostromo,1904|"Charles Dickens","United Kingdom",images/great-expectations.jpg,English,"https://en.wikipedia.org/wiki/Great_Expectations\n",194,"Great Expectations",1861|"Denis Diderot",France,images/jacques-the-fatalist.jpg,French,"https://en.wikipedia.org/wiki/Jacques_the_Fatalist\n",596,"Jacques the Fatalist",1796|"Alfred Döblin",Germany,images/berlin-alexanderplatz.jpg,German,"https://en.wikipedia.org/wiki/Berlin_Alexanderplatz\n",600,"Berlin Alexanderplatz",1929|"Fyodor Dostoevsky",Russia,images/crime-and-punishment.jpg,Russian,"https://en.wikipedia.org/wiki/Crime_and_Punishment\n",551,"Crime and Punishment",1866|"Fyodor Dostoevsky",Russia,images/the-idiot.jpg,Russian,"https://en.wikipedia.org/wiki/The_Idiot\n",656,"The Idiot",1869|"Fyodor Dostoevsky",Russia,images/the-possessed.jpg,Russian,"https://en.wikipedia.org/wiki/Demons_(Dostoyevsky_novel)\n",768,"The 
Possessed",1872|"Fyodor Dostoevsky",Russia,images/the-brothers-karamazov.jpg,Russian,"https://en.wikipedia.org/wiki/The_Brothers_Karamazov\n",824,"The Brothers Karamazov",1880|"George Eliot","United Kingdom",images/middlemarch.jpg,English,"https://en.wikipedia.org/wiki/Middlemarch\n",800,Middlemarch,1871|"Ralph Ellison","United States",images/invisible-man.jpg,English,"https://en.wikipedia.org/wiki/Invisible_Man\n",581,"Invisible Man",1952|Euripides,Greece,images/medea.jpg,Greek,"https://en.wikipedia.org/wiki/Medea_(play)\n",104,Medea,-431|"William Faulkner","United States",images/absalom-absalom.jpg,English,"https://en.wikipedia.org/wiki/Absalom,_Absalom!\n",313,"Absalom, Absalom!",1936|"William Faulkner","United States",images/the-sound-and-the-fury.jpg,English,"https://en.wikipedia.org/wiki/The_Sound_and_the_Fury\n",326,"The Sound and the Fury",1929|"Gustave Flaubert",France,images/madame-bovary.jpg,French,"https://en.wikipedia.org/wiki/Madame_Bovary\n",528,"Madame Bovary",1857|"Gustave Flaubert",France,images/l-education-sentimentale.jpg,French,"https://en.wikipedia.org/wiki/Sen
... (truncated)
minemizer
chars: 14,458 tokens: 4,520 chars_og/tok: 6.2 enc_chars/tok: 3.2
<|begin▁of▁sentence|>author; country; imageLink; language; link; pages; title; year
Chinua Achebe; Nigeria; images/things-fall-apart.jpg; English; https://en.wikipedia.org/wiki/Things_Fall_Apart
;·209; Things Fall Apart;·1958
Hans Christian Andersen; Denmark; images/fairy-tales.jpg; Danish; https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵
;·784; Fairy tales;·1836
Dante Alighieri; Italy; images/the-divine-comedy.jpg; Italian; https://en.wikipedia.org/wiki/Divine_Comedy
;·928; The Divine Comedy;·1315
Unknown; Sumer and Akkadian Empire; images/the-epic-of-gilgamesh.jpg; Akkadian; https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
;·160; The Epic Of Gilgamesh; -1700
Unknown; Achaemenid Empire; images/the-book-of-job.jpg; Hebrew; https://en.wikipedia.org/wiki/Book_of_Job
;·176; The Book Of Job; -600
Unknown; India/Iran/Iraq/Egypt/Tajikistan; images/one-thousand-and-one-nights.jpg; Arabic; https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
;·288; One Thousand and One Nights;·1200
Unknown; Iceland; images/njals-saga.jpg; Old Norse; https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
;·384; Njál's Saga;·1350
Jane Austen; United Kingdom; images/pride-and-prejudice.jpg; English; https://en.wikipedia.org/wiki/Pride_and_Prejudice
;·226; Pride and Prejudice;·1813
Honoré de Balzac; France; images/le-pere-goriot.jpg; French; https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
;·443; Le Père Goriot;·1835
Samuel Beckett; Republic of Ireland; images/molloy-malone-dies-the-unnamable.jpg; French, English; https://en.wikipedia.org/wiki/Molloy_(novel)↵
;·256; Molloy, Malone Dies, The Unnamable, the trilogy;·1952
Giovanni Boccaccio; Italy; images/the-decameron.jpg; Italian; https://en.wikipedia.org/wiki/The_Decameron
;·1024; The Decameron;·1351
Jorge Luis Borges; Argentina; images/ficciones.jpg; Spanish; https://en.wikipedia.org/wiki/Ficciones
;·224; Ficciones;·1965
... (truncated)
minemizer (compact)
chars: 13,753 tokens: 4,387 chars_og/tok: 6.4 enc_chars/tok: 3.1
<|begin▁of▁sentence|>author;country;imageLink;language;link;pages;title;year
Chinua Achebe;Nigeria;images/things-fall-apart.jpg;English;https://en.wikipedia.org/wiki/Things_Fall_Apart
;209;Things Fall Apart;1958
Hans Christian Andersen;Denmark;images/fairy-tales.jpg;Danish;https://en.wikipedia.org/wiki/Fairy_Tales_Told_for_Children._First_Collection.↵
;784;Fairy tales;1836
Dante Alighieri;Italy;images/the-divine-comedy.jpg;Italian;https://en.wikipedia.org/wiki/Divine_Comedy
;928;The Divine Comedy;1315
Unknown;Sumer and Akkadian Empire;images/the-epic-of-gilgamesh.jpg;Akkadian;https://en.wikipedia.org/wiki/Epic_of_Gilgamesh
;160;The Epic Of Gilgamesh;-1700
Unknown;Achaemenid Empire;images/the-book-of-job.jpg;Hebrew;https://en.wikipedia.org/wiki/Book_of_Job
;176;The Book Of Job;-600
Unknown;India/Iran/Iraq/Egypt/Tajikistan;images/one-thousand-and-one-nights.jpg;Arabic;https://en.wikipedia.org/wiki/One_Thousand_and_One_Nights
;288;One Thousand and One Nights;1200
Unknown;Iceland;images/njals-saga.jpg;Old Norse;https://en.wikipedia.org/wiki/Nj%C3%A1ls_saga
;384;Njál's Saga;1350
Jane Austen;United Kingdom;images/pride-and-prejudice.jpg;English;https://en.wikipedia.org/wiki/Pride_and_Prejudice
;226;Pride and Prejudice;1813
Honoré de Balzac;France;images/le-pere-goriot.jpg;French;https://en.wikipedia.org/wiki/Le_P%C3%A8re_Goriot
;443;Le Père Goriot;1835
Samuel Beckett;Republic of Ireland;images/molloy-malone-dies-the-unnamable.jpg;French, English;https://en.wikipedia.org/wiki/Molloy_(novel)↵
;256;Molloy, Malone Dies, The Unnamable, the trilogy;1952
Giovanni Boccaccio;Italy;images/the-decameron.jpg;Italian;https://en.wikipedia.org/wiki/The_Decameron
;1024;The Decameron;1351
Jorge Luis Borges;Argentina;images/ficciones.jpg;Spanish;https://en.wikipedia.org/wiki/Ficciones
;224;Ficciones;1965
... (truncated)
countries.json — Original: 1133948 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)1,133,948402,6262.82.8
JSON (min)787,962304,0933.72.6
CSVN/A
TSVN/A
YAML641,939206,6315.53.1
TOON691,140202,8755.63.4
TSON423,383158,5547.22.7
minemizer323,130120,1159.42.7
minemizer (compact)299,485124,2009.12.4
JSON (pretty)
chars: 1,133,948 tokens: 402,626 chars_og/tok: 2.8 enc_chars/tok: 2.8
<|begin▁of▁sentence|>[↵
· {↵
··· "name": {↵
····· "common": "Aruba",↵
····· "official": "Aruba",↵
····· "native": {↵
······· "nld": {↵
········· "official": "Aruba",↵
········· "common": "Aruba"↵
······· },↵
······· "pap": {↵
········· "official": "Aruba",↵
········· "common": "Aruba"↵
······· }↵
····· }↵
··· },↵
··· "tld": [↵
····· ".aw"↵
··· ],↵
··· "cca2": "AW",↵
··· "ccn3": "533",↵
··· "cca3": "ABW",↵
··· "cioc": "ARU",↵
··· "independent": false,↵
··· "status": "officially-assigned",
... (truncated)
JSON (min)
chars: 787,962 tokens: 304,093 chars_og/tok: 3.7 enc_chars/tok: 2.6
<|begin▁of▁sentence|>[{"name":{"common":"Aruba","official":"Aruba","native":{"nld":{"official":"Aruba","common":"Aruba"},"pap":{"official":"Aruba","common":"Aruba"}}},"tld":[".aw"],"cca2":"AW","ccn3":"533","cca3":"ABW","cioc":"ARU","independent":false,"status":"officially-assigned","unMember":false,"unRegionalGroup":"","currencies":{"AWG":{"name":"Aruban florin","symbol":"\u0192"}},"idd":{"root":"+2","suffixes":["97"]},"capital":["Oranjestad"],"altSpellings":["AW"],"region":"Americas","subregion":"Caribbean","languages":{"nld":"Dutch","pap":"Papiamento"},"translations":{"ara":{"official":"\u0623\u0631\u0648\u0628\u0627","common":"\u0623\u0631\u0648\u0628\u0627"},"bre":{"official":"Aruba","common":"Aruba"},"ces":{"official":"Aruba","common":"Aruba"},"deu":{"official":"Aruba","common":"Aruba"},"est":{"official":"Aruba","common":"Aruba"},"fin":{"official":"Aruba","common":"Aruba"},"fra":{"official":"Aruba","common":"Aruba"},"hrv":{"official":"Aruba","common":"Aruba"},"hun":{"official":"Aruba","common":"Aruba"},"ita":{"official":"Aruba","common":"Aruba"},"jpn":{"official":"\u30a2\u30eb\u30d0","common":"\u30a2\u30eb\u30d0"},"kor":{"official":"\uc544\ub8e8\ubc14","common":"\uc544\ub8e8\ubc14"},"nld":{"official":"Aruba","common":"Aruba"},"per":{"official":"\u0622\u0631\u0648\u0628\u0627","common":"\u0622\u0631\u0648\u0628\u0627"},"pol":{"official":"Aruba","common":"Aruba"},"por":{"official":"Aruba","common":"Aruba"},"rus":{"official":"\u0410\u0440\u0443\u0431\u0430","common":"\u0410\u0440\u0443\u0431\u0430"},"slk":{"official":"Aruba","common":"Aruba"},"spa":{"official":"Aruba","common":"Aruba"},"srp":{"official":"Aruba","common":"Aruba"},"swe":{"official":"Aruba","common":"Aruba"},"tur":{"official":"Aruba","common":"Aruba"},"urd":{"official":"\u0627\u0631\u0648\u0628\u0627","common":"\u0627\u0631\u0648\u0628\u0627"},"zho":{"official":"\u963f\u9c81\u5df4","common":"\u963f\u9c81\u5df4"}},"latlng":[12.5,-69.96666666],"landlocked":false,"borders":[],"area":180,"flag":"\ud83c\u
dde6\ud83c\uddfc","demonyms":{"eng":{"f":"Aruban","m":"Aruban"},"fra":{"f":"Arubaise","m":"Arubais"}}},{"name":{"common":"Afghanistan","official":"Islamic Republic of Afghanistan","native":{"prs":{"official":"\u062c\u0645\u0647\u0648\u0631\u06cc \u0627\u0633\u0644\u0627\u0645\u06cc \u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"pus":{"official":"\u062f \u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646 \u0627\u0633\u0644\u0627\u0645\u064a \u062c\u0645\u0647\u0648\u0631\u06cc\u062a","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"tuk":{"official":"Owganystan Yslam Respublikasy","common":"Owganystan"}}},"tld":[".af"],"cca2":"AF","ccn3":"004","cca3":"AFG","cioc":"AFG","independent":true,"status":"officially-assigned","unMember":true,"unRegionalGroup":"Asia and the Pacific Group","currencies":{"AFN":{"name":"Afghan afghani","symbol":"\u060b"}},"idd":{"root":"+9","suffixes":["3"]},"capital":["Kabul"],"altSpellings":["AF","Af\u0121\u0101nist\u0101n"],"region":"Asia","subregion":"Southern Asia","languages":{"prs":"Dari","pus":"Pashto","tuk":"Turkmen"},"translations":{"ara":{"official":"\u062c\u0645\u0647\u0648\u0631\u064a\u0629 \u0623\u0641\u0641\u0627\u0646\u0633\u062a\u0627\u0646 \u0627\u0644\u0625\u0633\u0644\u0627\u0645\u064a\u0629","common":"\u0623\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"bre":{"official":"Republik Islamek Afghanistan","common":"Afghanistan"},"ces":{"official":"Afgh\u00e1nsk\u00e1 isl\u00e1msk\u00e1 republika","common":"Afgh\u00e1nist\u00e1n"},"deu":{"official":"Islamische Republik Afghanistan","common":"Afghanistan"},"est":{"official":"Afganistani Islamivabariik","common":"Afganistan"},"fin":{"official":"Afganistanin islamilainen tasavalta","common":"Afganistan"},"fra":{"official":"R\u00e9publique islamique d'Afghanistan","common":"Afghanistan"},"hrv":{"official":"Islamska Republika 
Afganistan","common":"Afganistan"},"hun":{"official":"Afganiszt\u00e1ni Iszl\u00e1m K\u00f6zt\u00e1rsas\u00e1g","common":"Afganiszt\u00e1n"},"ita":{"official":"Repubblica islamica dell'Afghanistan","common":"Afghanistan"},"jpn":{"official":"\u30a2\u30d5\u30ac\u30cb\u30b9\u30bf\u30f3\u30fb\u30a4\u30b9\u30e9\u30e0\u5171\u548c\u56fd","common":"\u30a2\u30d5\u30ac\u30cb\u30b9\u30bf\u30f3"},"kor":{"official":"\uc544\ud504\uac00\ub2c8\uc2a4\ud0c4 \uc774\uc2ac\ub78c \uacf5\ud654\uad6d","common":"\uc544\ud504\uac00\ub2c8\uc2a4\ud0c4"},"nld":{"official":"Islamitische Republiek Afghanistan","common":"Afghanistan"},"per":{"official":"\u062c\u0645\u0647\u0648\u0631\u06cc \u0627\u0633\u0644\u0627\u0645\u06cc \u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646","common":"\u0627\u0641\u063a\u0627\u0646\u0633\u062a\u0627\u0646"},"pol":{"official":"Islamska Republika Afganistanu","common":"Afganistan"},"por":{"official":"Rep\u00fablica Isl\u00e2mica do Afeganist\u00e3o","common":"Afeganist\u00e3o"},"rus":{"official":"\u0418\u0441\u043b\u0430\u043c\u0441\u043a\u0430\u044f \u0420\
... (truncated)
CSV: N/A
TSV: N/A
YAML
chars: 641,939 tokens: 206,631 chars_og/tok: 5.5 enc_chars/tok: 3.1
<|begin▁of▁sentence|>- altSpellings:↵
· - AW
· area:·180
· borders: []↵
· capital:↵
· - Oranjestad
· cca2: AW
· cca3: ABW
· ccn3: '533'↵
· cioc: ARU
· currencies:↵
··· AWG:↵
····· name: Aruban florin
····· symbol:
· demonyms:↵
··· eng:↵
····· f: Aruban
····· m: Aruban
··· fra:↵
····· f: Arubaise
····· m: Arubais
· flag:
··idd:↵
··· root: '+2'↵
··· suffixes:
... (truncated)
TOON
chars: 691,140 tokens: 202,875 chars_og/tok: 5.6 enc_chars/tok: 3.4
<|begin▁of▁sentence|>[250]:↵
· -↵
··· name:↵
····· common: Aruba
····· official: Aruba
····· native:↵
······· nld:↵
········· official: Aruba
········· common: Aruba
······· pap:↵
········· official: Aruba
········· common: Aruba
··· tld[1]: .aw
··· cca2: AW
··· ccn3: "533"↵
··· cca3: ABW
··· cioc: ARU
··· independent: false
··· status: officially-assigned
··· unMember: false
··· unRegionalGroup: ""↵
··· currencies:↵
····· AWG:↵
······· name: Aruban florin
······· symbol:
... (truncated)
TSON
chars: 423,383 tokens: 158,554 chars_og/tok: 7.2 enc_chars/tok: 2.7
<|begin▁of▁sentence|>{@name(@common,official,native),tld,cca2,ccn3,cca3,cioc,independent,status,unMember,unRegionalGroup,currencies,idd(@root,suffixes),capital,altSpellings,region,subregion,languages,translations(@ara,bre,ces,deu,est,fin,fra,hrv,hun,ita,jpn,kor,nld,per,pol,por,rus,slk,spa,srp,swe,tur,urd,zho),latlng,landlocked,borders,area,flag,demonyms(@eng,fra)#250|{Aruba,Aruba,{@nld,pap|{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba}}},[.aw],AW,"533",ABW,ARU,false,officially-assigned,false,"",{@AWG|{@name,symbol|"Aruban florin",ƒ}},{"+2",["97"]},[Oranjestad],[AW],Americas,Caribbean,{@nld,pap|Dutch,Papiamento},{{@official,common|أروبا,أروبا},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|アル,アル},{@official,common|,},{@official,common|Aruba,Aruba},{@official,common|آروبا,آروبا},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Аруба,Аруба},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|Aruba,Aruba},{@official,common|اروبا,اروبا},{@official,common|,}},[12.5,-69.96666666],false,[],180,,{{@f,m|Aruban,Aruban},{@f,m|Arubaise,Arubais}}|{Afghanistan,"Islamic Republic of Afghanistan",{@prs,pus,tuk|{@official,common|"جمهوری اسلامی افغانستان",افغانستان},{@official,common|"د افغانستان اسلامي جمهوریت",افغانستان},{@official,common|"Owganystan Yslam Respublikasy",Owganystan}}},[.af],AF,"004",AFG,AFG,true,officially-assigned,true,"Asia and the Pacific Group",{@AFN|{@name,symbol|"Afghan afghani",}},{"+9",["3"]},[Kabul],[AF,Afānistān],Asia,"Southern Asia",{@prs,pus,tuk|Dari,Pashto,Turkmen},{{@official,common|"جمهورية أففانستان الإسلامية",أفغانستان},{@official,common|"Republik Islamek 
Afghanistan",Afghanistan},{@official,common|"Afghánská isms republika",Afghánistán},{@official,common|"Islamische Republik Afghanistan",Afghanistan},{@official,common|"Afganistani Islamivabariik",Afganistan},{@official,common|"Afganistanin islamilainen tasavalta",Afganistan},{@official,common|"République islamique d'Afghanistan",Afghanistan},{@official,common|"Islamska Republika Afganistan",Afganistan},{@official,common|"Afganisztáni Iszlámztársaság",Afganisztán},{@official,common|"Repubblica islamica dell'Afghanistan",Afghanistan},{@official,common|スタ共和国,スタ},{@official,common|"",},{@official,common|"Islamitische Republiek Afghanistan",Afghanistan},{@official,common|"جمهوری اسلامی افغانستان",افغانستان},{@official,common|"Islamska Republika Afganistanu",Afganistan},{@official,common|"República Islâmica do Afeganistão",Afeganistão},{@official,common|"Исламская Республика Афганистан",Афганистан},{@official,common|"Afgánsky islamský štát",Afganistan},{@official,common|"República Islámica de Afganistán",Afganistán},{@official,common|"Islamska Republika Avganistan",Avganistan},{@official,common|"Islamiska republiken Afghanistan",Afghanistan},{@official,common|"Afganistan İslam Cumhuriyeti",Afganistan},{@official,common|"اسلامی جمہوریہ افغانستان",افغانستان},{@official,common|阿富汗伊斯兰共和国,阿富汗}},[33,65],true,[IRN,PAK,TKM,UZB,TJK,CHN],652230,,{{@f,m|Afghan,Afghan},{@f,m|Afghane,Afghan}}|{Angola,"Republic of Angola",{@por|{@official,common|"República de Angola",Angola}}},[.ao],AO,"024",AGO,ANG,true,officially-assigned,true,"African Group",{@AOA|{@name,symbol|"Angolan kwanza",Kz}},{"+2",["44"]},[Luanda],[AO,"República de Angola","ʁɛpublika de an'ɡɔla"],Africa,"Middle Africa",{@por|Portuguese},{{@official,common|أنغولا,"جمهورية أنغولا"},{@official,common|"Republik Angola",Angola},{@official,common|"Angolská republika",Angola},{@official,common|"Republik Angola",Angola},{@official,common|"Angola Vabariik",Angola},{@official,common|"Angolan 
tasavalta",Angola},{@official,common|"République d'Angola",Angola},{@official,common|"Republika Angola",Angola},{@official,common|Angola,Angola},{@official,common|"Repubblica dell'Angola",Angola},{@official,common|共和国,},{@official,common|"",},{@official,common|"Republiek Angola",Angola},{@official,common|"جمهوری آنگولا",آنگولا},{@official,common|"Republika Angoli",Angola},{@official,common|"República de Angola",Angola},{@official,common|"Республика Ангола",Ангола},{@official,common|"Angolská republika",Angola},{@official,common|"República de Angola",Angola},{@official,common|"Republika Angola",Angola},{@official,common|"Republiken Angola",Angola},{@official,common|"Angola Cumhuriyeti",Angola},{@official,common|"جمہوریہ انگولہ",انگولہ},{@official,common|共和国,}},[-12.5,18.5],false,[COG,COD,ZMB,NAM],1246700,,{{@f,m|Angolan,Angolan},{@f,m|Angolaise,Angolais}}|{Anguilla,Anguilla,{@eng|{@official,common|Anguilla,Anguilla}}},[.ai],AI,"660",AIA,"",false,officially-assigned,false,"",{@XCD
... (truncated)
minemizer
chars: 323,130 tokens: 120,115 chars_og/tok: 9.4 enc_chars/tok: 2.7
<|begin▁of▁sentence|>name{ common; official; native{ ...}}; tld[]; cca2; ccn3; cca3; cioc; independent; status; unMember; unRegionalGroup; currencies{ ...};·idd{ root; suffixes[]}; capital[]; altSpellings[]; region; subregion; languages{ ...}; translations{ ara{ official; common}; bre{ official; common}; ces{ official; common}; deu{ official; common}; est{ official; common}; fin{ official; common}; fra{ official; common}; hrv{ official; common}; hun{ official; common}; ita{ official; common}; jpn{ official; common}; kor{ official; common}; nld{ official; common}; per{ official; common}; pol{ official; common}; por{ official; common}; rus{ official; common}; slk{ official; common}; spa{ official; common}; srp{ official; common}; swe{ official; common}; tur{ official; common}; urd{ official; common}; zho{ official; common}}; latlng[]; landlocked; borders[]; area; flag; demonyms{ eng{ f; m}; fra{ f; m}}↵
{ Aruba; Aruba;{ nld:{ official: Aruba; common: Aruba}; pap:{ official: Aruba; common: Aruba}}};[ .aw]; AW;·533; ABW; ARU;false; officially-assigned;false;;{ AWG:{ name: Aruban florin; symbol:}};{ +2;[·97]};[ Oranjestad];[ AW]; Americas; Caribbean;{ nld: Dutch; pap: Papiamento};{{ أروبا; أروبا};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{·アル;·アル};{;};{ Aruba; Aruba};{ آروبا; آروبا};{ Aruba; Aruba};{ Aruba; Aruba};{ Аруба; Аруба};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ Aruba; Aruba};{ اروبا; اروبا};{·;·}};[·12.5; -69.96666666];false;[];·180;;{{ Aruban; Aruban};{ Arubaise; Arubais}}↵
{ Afghanistan; Islamic Republic of Afghanistan;{ prs:{ official: جمهوری اسلامی افغانستان; common: افغانستان}; pus:{ official: د افغانستان اسلامي جمهوریت; common: افغانستان}; tuk:{ official: Owganystan Yslam Respublikasy; common: Owganystan}}};[ .af]; AF;·004; AFG; AFG;true; officially-assigned;true; Asia and the Pacific Group;{ AFN:{ name: Afghan afghani; symbol:}};{ +9;[·3]};[ Kabul];[ AF; Afānistān]; Asia; Southern Asia;{ prs: Dari; pus: Pashto; tuk: Turkmen};{{ جمهورية أففانستان الإسلامية; أفغانستان};{ Republik Islamek Afghanistan; Afghanistan};{ Afghánská isms republika; Afghánistán};{ Islamische Republik Afghanistan; Afghanistan};{ Afganistani Islamivabariik; Afganistan};{ Afganistanin islamilainen tasavalta; Afganistan};{ République islamique d'Afghanistan; Afghanistan};{ Islamska Republika Afganistan; Afganistan};{ Afganisztáni Iszlámztársaság; Afganisztán};{ Repubblica islamica dell'Afghanistan; Afghanistan};{·スタ共和国;·スタ};{;};{ Islamitische Republiek Afghanistan; Afghanistan};{ جمهوری اسلامی افغانستان; افغانستان};{ Islamska Republika Afganistanu; Afganistan};{ República Islâmica do Afeganistão; Afeganistão};{ Исламская Республика Афганистан; Афганистан};{ Afgánsky islamský štát; Afganistan};{ República Islámica de Afganistán; Afganistán};{ Islamska Republika Avganistan; Avganistan};{ Islamiska republiken Afghanistan; Afghanistan};{ Afganistan İslam Cumhuriyeti; Afganistan};{ اسلامی جمہوریہ افغانستان; افغانستان};{·阿富汗伊斯兰共和国;·阿富汗}};[·33;·65];true;[ IRN; PAK; TKM; UZB; TJK; CHN];·652230;;{{ Afghan; Afghan};{ Afghane; Afghan}}↵
{ Angola; Republic of Angola;{ por:{ official: República de Angola; common: Angola}}};[ .ao]; AO;·024; AGO; ANG;true; officially-assigned;true; African Group;{ AOA:{ name: Angolan kwanza; symbol: Kz}};{ +2;[·44]};[ Luanda];[ AO; República de Angola;·ʁɛpublika de an'ɡɔla]; Africa; Middle Africa;{ por: Portuguese};{{ أنغولا; جمهورية أنغولا};{ Republik Angola; Angola};{ Angolská republika; Angola};{ Republik Angola; Angola};{ Angola Vabariik; Angola};{ Angolan tasavalta; Angola};{ République d'Angola; Angola};{ Republika Angola; Angola};{ Angola; Angola};{ Repubblica dell'Angola; Angola};{·共和国;·};{;};{ Republiek Angola; Angola};{ جمهوری آنگولا; آنگولا};{ Republika Angoli; Angola};{ República de Angola; Angola};{ Республика Ангола; Ангола};{ Angolská republika; Angola};{ República de Angola; Angola};{ Republika Angola; Angola};{ Republiken Angola; Angola};{ Angola Cumhuriyeti; Angola};{ جمہوریہ انگولہ; انگولہ};{·共和国;·}};[ -12.5;·18.5];false;[ COG; COD; ZMB; NAM];·1246700;;{{ Angolan; Angolan};{ Angolaise; Angolais}}↵
{ Anguilla; Anguilla;{ eng:{ official: Anguilla; common: Anguilla}}};[ .ai]; AI;·660; AIA;;false; officially-assigned;false;;{ XCD:{ name: Eastern Caribbean dollar; symbol: $}};{ +1;[·264]};[ The Valley];[ AI]; Americas; Caribbean;{ eng: English};{{ أنغويلا; أنغويلا};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Anguilla; Angvila};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{·;·};{;};{ Anguilla; Anguilla};{ آنگویلا; آنگویلا};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ Ангилья; Ангилья};{ Anguilla; Anguilla};{ Anguila; Anguilla};{ Angvila; Angvila};{ Anguilla; Anguilla};{ Anguilla; Anguilla};{ اینگویلا; اینگویلا};{·;·}};[·18.25; -63.16666666];false;[];·91;;{{ Anguillian; Anguillian};{ Anguillane; Anguillan}}↵
{ Åland Islands; Åland Islands;{ swe:{ official: Landskapet Åland; common: Åland}}};[ .ax]; AX;·248; ALA;;false; officially-assigned;false;;{ EUR:{ name: Euro; symbol:}};{ +3;[·5818]};[ Mariehamn];[ AX; Aaland; Aland; Ahvenanmaa]; Europe; Northern Europe;{ swe: Swedish};{{ جزر أولاند; جزر أولاند};{ Inizi Åland; Åland};{ Ålandské ostrovy; Ålandy};{ Åland-Inseln; Åland};{ Ahvenamaa maakond; Ahvenamaa};{ Ahvenanmaan maakunta; Ahvenanmaa};{ Ahvenanmaa; Ahvenanmaa};{ Aland Islands; Ålandski otoci};{ Åland-szigetek; Åland-szigetek};{ Isole Åland; Isole Aland};{·ンド;·ンド};{;};{ Åland eilanden; Ålandeilanden};{ جزایر الند; جزایر الند};{ Wyspy Alandzkie; Wyspy Alandzkie};{ Ilhas Åland; Alândia};{ Аландские острова; Аландские острова};{ Alandské ostrovy; Alandy};{ Islas Åland; Alandia};{ Olandska Ostrva; Olandska Ostrva};{ Åland; Åland};{ Åland Adaları; Åland};{ جزائر اولند; جزائر اولند};{·群岛;·群岛}};[·60.116667;·19.9];false;[];·1580;;{{ Ålandish; Ålandish};{ Ålandaise; Ålandais}}↵
{ Albania; Republic of Albania;{ sqi:{ official: Republika e Shqipërisë; common: Shqipëria}}};[ .al]; AL;·008; ALB; ALB;true; officially-assigned;true; Eastern European Group;{ ALL:{ name: Albanian lek; symbol: L}};{ +3;[·55]};[ Tirana];[ AL; Shqipëri; Shqipëria; Shqipnia]; Europe; Southeast Europe;{ sqi: Albanian};{{ جمهورية ألبانيا; ألبانيا};{ Republik Albania; Albania};{ Albánská republika; Albánie};{ Republik Albanien; Albanien};{ Albaania Vabariik; Albaania};{ Albanian tasavalta; Albania};{ République d'Albanie; Albanie};{ Republika Albanija; Albanija};{ Albánztársaság; Albánia};{ Repubblica d'Albania; Albania};{·アルニア共和国;·アルニア};{;};{ Republiek Alban; Alban};{ جمهوری آلبانی; آلبانی};{ Republika Albanii; Albania};{ República da Albânia; Albânia};{ Республика Албания; Албания};{ Albánska republika; Albánsko};{ República de Albania; Albania};{ Republika Albanija; Albanija};{ Republiken Albanien; Albanien};{ Arnavutluk Cumhuriyeti; Arnavutluk};{ جمہوریہ البانیا; البانیا};{·阿尔尼亚共和国;·阿尔尼亚}};[·41;·20];false;[ MNE; GRC; MKD; UNK];·28748;;{{ Albanian; Albanian};{ Albanaise; Albanais}}↵
{ Andorra; Principality of Andorra;{ cat:{ official: Principat d'Andorra; common: Andorra}}};[ .ad]; AD;·020; AND; AND;true; officially-assigned;true; Western European and Others Group;{ EUR:{ name: Euro; symbol:}};{ +3;[·76]};[ Andorra la Vella];[ AD; Principality of Andorra; Principat d'Andorra]; Europe; Southern Europe;{ cat: Catalan};{{ إمارة أندورا; أندورا};{ Priñselezh Andorra; Andorra};{ Andorrské kžect; Andorra};{ Fürstentum Andorra; Andorra};{ Andorra Vürstiriik; Andorra};{ Andorran ruhtinaskunta; Andorra};{ Principauté d'Andorre; Andorre};{ Kneževina Andora; Andora};{ Andorra; Andorra};{ Principato di Andorra; Andorra};{·ンド;·ンド};{;};{ Prinsdom Andorra; Andorra};{ شاهزادهنشین آندورا; آندورا};{ Księstwo Andory; Andora};{ Principado de Andorra; Andorra};{ Княжество Андорра; Андорра};{ Andorrské kniežatstvo; Andorra};{ Principado de Andorra; Andorra};{ Kneževina Andora; Andora};{ Furstendömet Andorra; Andorra};{ Andorra Prensliği; Andorra};{ اماراتِ انڈورا; انڈورا};{·;·}};[·42.5;·1.5];true;[ FRA; ESP];·468;;{{ Andorran; Andorran};{ Andorrane; Andorran}}↵
{ United Arab Emirates; United Arab Emirates;{ ara:{ official: الإمارات العربية المتحدة; common: الإمارات}}};[ .ae; امارات.]; AE;·784; ARE; UAE;true; officially-assigned;true; Asia and the Pacific Group;{ AED:{ name: United Arab Emirates dirham; symbol: د.إ}};{ +9;[·71]};[ Abu Dhabi];[ AE; UAE; Emirates]; Asia; Western Asia;{ ara: Arabic};{{ الإمارات العربية المتحدة; الإمارات};{ Emirelezhioù Arab Unanet; Emirelezhioù Arab Unanet};{ Spojené arabs emiráty; Spojené arabs emiráty};{ Vereinigte Arabische Emirate; Vereinigte Arabische Emirate};{ Araabia Ühendemiraadid; Araabia Ühendemiraadid};{ Yhdistyneet arabiemiirikunnat; Arabiemiraatit};{ Émirats arabes unis; Émirats arabes unis};{ Ujedinjeni Arapski Emirati; Ujedinjeni Arapski Emirati};{ Egyesült Arab Emírségek; Egyesült Arab Emírségek};{ Emirati Arabi Uniti; Emirati Arabi Uniti};{·; UAE};{;};{ Verenigde Arabische Emiraten; Verenigde Arabische Emiraten};{ امارات متحده عربی; امارات};{ Zjednoczone Emiraty Arabskie; Zjednoczone Emiraty Arabskie};{ Emirados Árabes Unidos; Emirados Árabes Unidos};{ Объединенные Арабские Эмираты; Объединённые Арабские Эмираты};{ Spojené arabs emiráty; Spojené arabs emiráty};{ Emiratos Árabes Unidos; Emiratos Árabes Unidos};{ Ujedinjeni Arapski Emirati; Ujedinjeni Arapski Emirati};{ Förenade Arabemiraten; Förenade Arabemiraten};{ Birleşik Arap Emirlikleri; Birleşik Arap Emirlikleri};{ متحدہ عرب امارات; متحدہ عرب امارات};{·阿拉伯联合;·阿拉伯联合}};[·24;·54];false;[ OMN; SAU];·83600;;{{ Emirati; Emirati};{ Emirienne; Emirien}}↵
{ Argentina; Argentine Republic;{ grn:{ official: Argentine Republic; common: Argentina}; spa:{ official: República Argentina; common: Argentina}}};[ .ar]; AR;·032; ARG; ARG;true; officially-assigned;true; Latin American and Caribbean Group;{ ARS:{ name: Argentine peso; symbol: $}};{ +5;[·4]};[ Buenos Aires];[ AR; Argentine Republic; República Argentina]; Americas; South America;{ grn: Guaraní; spa: Spanish};{{ جمهورية الأرجنتين; الأرجنتين};{ Republik Arc'hantina; Arc'hantina};{ Argentins republika; Argentina};{ Argentinische Republik; Argentinien};{ Argentina Vabariik; Argentina};{ Argentiinan tasavalta; Argentiina};{ République argentine; Argentine};{ Argentinski Republika; Argentina};{ Argentinztársaság; Argentína};{ Repubblica Argentina; Argentina};{·アルンチ共和国;·アルンチ};{;};{ Argentijnse Republiek; Argentinië};{ جمهوری آرژانتین; آرژانتین};{ Republika Argentyńska; Argentyna};{ República Argentina; Argentina};{ Аргентинская Республика; Аргентина};{ Argentínska republika; Argentína};{ República Argentina; Argentina};{ Republika Argentina; Argentina};{ Republiken Argentina; Argentina};{ Arjantin Cumhuriyeti; Arjantin};{ جمہوریہ ارجنٹائن; ارجنٹائن};{·阿根廷共和国;·阿根廷}};[ -34; -64];false;[ BOL; BRA; CHL; PRY; URY];·2780400;;{{ Argentine; Argentine};{ Argentine; Argentin}}↵
{ Armenia; Republic of Armenia;{ hye:{ official: Հայաստանի Հանրապետություն; common: Հայաստան}}};[ .am]; AM;·051; ARM; ARM;true; officially-assigned;true; Eastern European Group;{ AMD:{ name: Armenian dram; symbol:}};{ +3;[·74]};[ Yerevan];[ AM; Hayastan; Republic of Armenia; Հայաստանի Հանրապետություն]; Asia; Western Asia;{ hye: Armenian};{{ جمهورية أرمينيا; أرمينيا};{ Republik Armenia; Armenia};{ Arménská republika; Arménie};{ Republik Armenien; Armenien};{ Armeenia Vabariik; Armeenia};{ Armenian tasavalta; Armenia};{ République d'Arménie; Arménie};{ Republika Armenija; Armenija};{ Örményország; Örményország};{ Repubblica di Armenia; Armenia};{·アルニア共和国;·アルニア};{;};{ Republiek Armen; Armen};{ جمهوری ارمنستان; ارمنستان};{ Republika Armenii; Armenia};{ República da Arménia; Arménia};{ Республика Армения; Армения};{ Arménska republika; Arménsko};{ República de Armenia; Armenia};{ Republika Jermenija; Jermenija};{ Republiken Armenien; Armenien};{ Ermenistan Cumhuriyeti; Ermenistan};{ جمہوریہ آرمینیا; آرمینیا};{·尼亚共和国;·尼亚}};[·40;·45];true;[ AZE; GEO; IRN; TUR];·29743;;{{ Armenian; Armenian};{ Arménienne; Arménien}}↵
{ American Samoa; American Samoa;{ eng:{ official: American Samoa; common: American Samoa}; smo:{ official: Sāmoa Amelika; common: Sāmoa Amelika}}};[ .as]; AS;·016; ASM; ASA;false; officially-assigned;false;;{ USD:{ name: United States dollar; symbol: $}};{ +1;[·684]};[ Pago Pago];[ AS; Amerika Sāmoa; Amelika Sāmoa; Sāmoa Amelika]; Oceania; Polynesia;{ eng: English; smo: Samoan};{{ ساموا الأمريكية; ساموا الأمريكية};{ Samoa Amerikan; Samoa Amerikan};{ Americká Samoa; Americká Samoa};{ Amerikanisch-Samoa; Amerikanisch-Samoa};{ Ameerika Samoa; Ameerika Samoa};{ Amerikan Samoa; Amerikan Samoa};{ Samoa américaines; Samoa américaines};{ amerka Samoa; Amerka Samoa};{ Szamoa; Szamoa};{ Samoa americane; Samoa Americane};{·;·アメリカ};{;};{ Amerikaans Samoa; Amerikaans Samoa};{ ساموآی آمریکا; ساموآی آمریکا};{ Samoa Amerykańskie; Samoa Amerykańskie};{ Samoa americana; Samoa Americana};{ американское Самоа; Американское Самоа};{ Americká Samoa; Americká Samoa};{ Samoa Americana; Samoa Americana};{ Amerka Samoa; Amerka Samoa};{ Amerikanska Samoa; Amerikanska Samoa};{ Amerikan Samoası; Amerikan Samoası};{ امریکی سمووا; امریکی سمووا};{·;·}};[ -14.33333333; -170];false;[];·199;;{{ American Samoan; American Samoan};{ Samoane; Samoan}}↵
{ Antarctica; Antarctica;{}};[ .aq]; AQ;·010; ATA;;false; officially-assigned;false;;{};{;[]};[];[ AQ]; Antarctic;;{};{{ أنتارتيكا; أنتارتيكا};{ Antarktika; Antarktika};{ Antarktida; Antarktida};{ Antarktika; Antarktis};{ Antarktika; Antarktika};{ Etelämanner; Etelämanner};{ Antarctique; Antarctique};{ Antarktika; Antarktika};{ Antarktisz; Antarktisz};{ Antartide; Antartide};{·;·大陸};{;};{ Antarctica; Antarctica};{ جنوبگان; جنوبگان};{ Antarktyka; Antarktyka};{ Antártica; Antártida};{ Антарктида; Антарктида};{ Antarktída; Antarktída};{ Antártida; Antártida};{ Antarktik; Antarktik};{ Antarktis; Antarktis};{ Antarktika; Antarktika};{ انٹارکٹکا; انٹارکٹکا};{·南极;·南极}};[ -90;·0];false;[];·14000000;;{{ Antarctican; Antarctican};{ Antarcticaine; Antarcticain}}↵
{ French Southern and Antarctic Lands; Territory of the French Southern and Antarctic Lands;{ fra:{ official: Territoire des Terres australes et antarctiques françaises; common: Terres australes et antarctiques françaises}}};[ .tf]; TF;·260; ATF;;false; officially-assigned;false;;{ EUR:{ name: Euro; symbol:}};{ +2;[·62]};[ Port-aux-Français];[ TF; French Southern Territories]; Antarctic;;{ fra: French};{{ مقاطعات وأقاليم ما وراء البحار الفرنسية; أراض فرنسية جنوبية وأنتارتيكية};{ Tiriad Douaroù Aostral hag Antarktikel Frañs; Douaroù Aostral hag Antarktikel Frañs};{ Teritorium Francouzská již a antarktická území; Francouzská již a antarktická území};{ Gebiet der Französisch Süd- und Antarktisgebiete; Französische Süd- und Antarktisgebiete};{ Prantsuse Lõunaalad; Prantsuse Lõunaalad};{ Ranskan eteläiset ja antarktiset alueet; Ranskan eteläiset ja antarktiset alueet};{ Territoire des Terres australes et antarctiques françaises; Terres australes et antarctiques françaises};{ Teritoriju Francuski južni i antarktički teritoriji; Francuski južni i antarktički teritoriji};{ Franciali és antarktiszi területek; Franciali és antarktiszi területek};{ Territorio della australi e antartiche francesi Terre; Territori Francesi del Sud};{·ランス;·ランス南方地域};{ 지역; 지역};{ Grondgebied van de Franse Zuidelijke en Antarctische gebieden; Franse Gebieden in de zuidelijke Indische Oceaan};{ سرزمینهای جنوبی و جنوبگانی فرانسه; سرزمینهای جنوبی و جنوبگانی فرانسه};{ Francuskie Terytoria Południowe i Antarktyczne; Francuskie Terytoria Południowe i Antarktyczne};{ Território do Sul e Antártica Francesa; Terras Austrais e Antárticas Francesas};{ Территория Французские Южные и Антарктические земли; Французские Южные и Антарктические территории};{ Francúzske juž a antarktické územia; Francúzske juŽ a antarktické územia};{ Territorio del Francés Tierras australes y antárticas; Tierras Australes y Antárticas Francesas};{ Francuske južne i antarktičke zemlje; Francuske južne i antarktičke zemlje};{ Franska 
syd- och Antarktisterritorierna; Franska södra territorierna};{ Fransızney ve Antarktika Toprakları; Fransızney ve Antarktika Toprakları};{ سرزمینِ جنوبی فرانسیسیہ و انٹارکٹیکہ; سرزمین جنوبی فرانسیسیہ و انٹارکٹیکا};{·法国南部南极土地;·法国南部南极土地}};[ -49.25;·69.167];false;[];·7747;;{{ French; French};{ Française; Français}}↵
{ Antigua and Barbuda; Antigua and Barbuda;{ eng:{ official: Antigua and Barbuda; common: Antigua and Barbuda}}};[ .ag]; AG;·028; ATG; ANT;true; officially-assigned;true; Latin American and Caribbean Group;{ XCD:{ name: Eastern Caribbean dollar; symbol: $}};{ +1;[·268]};[ Saint John's];[ AG]; Americas; Caribbean;{ eng: English};{{ أنتيغوا وباربودا; أنتيغوا وباربودا};{ Antigua ha Barbuda; Antigua ha Barbuda};{ Antigua a Barbuda; Antigua a Barbuda};{ Antigua und Barbuda; Antigua und Barbuda};{ Antigua ja Barbuda; Antigua ja Barbuda};{ Antigua ja Barbuda; Antigua ja Barbuda};{ Antigua -et-Barbuda; Antigua-et-Barbuda};{ Antigva i Barbuda; Antigva i Barbuda};{ Antigua és Barbuda; Antigua és Barbuda};{ Antigua e Barbuda; Antigua e Barbuda};{·ン��ィーブー�;·ン��ィーブー�};{;};{ Antigua en Barbuda; Antigua en Barbuda};{ آنتیگوا و باربودا; آنتیگوا و باربودا};{ Antigua i Barbuda; Antigua i Barbuda};{ Antigua e Barbuda; Antígua e Barbuda};{ Антигуа и Барбуда; Антигуа и Барбуда};{ Antigua a Barbuda; Antigua a Barbuda};{ Antigua y Barbuda; Antigua y Barbuda};{ Antigva i Barbuda; Antigva i Barbuda};{ Antigua och Barbuda; Antigua och Barbuda};{ Antigua ve Barbuda; Antigua ve Barbuda};{ اینٹیگوا و باربوڈا; اینٹیگوا و باربوڈا};{·;·}};[·17.05; -61.8];false;[];·442;;{{ Antiguan, Barbudan; Antiguan, Barbudan};{ Antiguaise et barbudienne; Antiguaise et barbudien}}↵
{ Australia; Commonwealth of Australia;{ eng:{ official: Commonwealth of Australia; common: Australia}}};[ .au]; AU;·036; AUS; AUS;true; officially-assigned;true; Western European and Others Group;{ AUD:{ name: Australian dollar; symbol: $}};{ +6;[·1]};[ Canberra];[ AU]; Oceania; Australia and New Zealand;{ eng: English};{{ كومونولث أستراليا; أستراليا};{ Kenglad Aostralia; Aostralia};{ Australs společenství; Austrálie};{ Commonwealth Australien; Australien};{ Austraalia Ühendus; Austraalia};{ Australian liittovaltio; Australia};{ Australie; Australie};{ Commonwealth of Australia; Australija};{ Ausztrál Államszövetség; Ausztrália};{ Commonwealth dell'Australia; Australia};{·ストリア;·ストリア};{스트리아;};{ Gemenebest van Austral; Austral};{ قلمرو همسود استرالیا; استرالیا};{ Związek Australijski; Australia};{ Comunidade da Austrália; Austrália};{ Содружество Австралии; Австралия};{ Austrálsky zz; Austrália};{ Mancomunidad de Australia; Australia};{ Komonvelt Australija; Australija};{ Australiska statsförbundet; Australien};{ Avustralya Federal Devleti; Avustralya};{ دولتِ مشترکہ آسٹریلیا; آسٹریلیا};{·澳大利亚联邦;·澳大利亚}};[ -27;·133];false;[];·7692024;;{{ Australian; Australian};{ Australienne; Australien}}↵
{ Austria; Republic of Austria;{ bar:{ official: Republik Österreich; common: Österreich}}};[ .at]; AT;·040; AUT; AUT;true; officially-assigned;true; Western European and Others Group;{ EUR:{ name: Euro; symbol:}};{ +4;[·3]};[ Vienna];[ AT; Osterreich; Oesterreich]; Europe; Central Europe;{ bar: Austro-Bavarian German};{{ جمهورية النمسا; النمسا};{ Republik Aostria; Aostria};{ Rakous republika; Rakousko};{ Republik Österreich; Österreich};{ Austria Vabariik; Austria};{ Itävallan tasavalta; Itävalta};{ République d'Autriche; Autriche};{ Republika Austrija; Austrija};{ Ausztria; Ausztria};{ Repubblica d'Austria; Austria};{·ストリア共和国;·ストリア};{스트리아;스트리아};{ Republiek Oostenrijk; Oostenrijk};{ جمهوری اتریش; اتریش};{ Republika Austrii; Austria};{ República da Áustria; Áustria};{ Австрийская Республика; Австрия};{ Rakúska republika; Rakúsko};{ República de Austria; Austria};{ Republika Austrija; Austrija};{ Republiken Österrike; Österrike};{ Avusturya Cumhuriyeti; Avusturya};{ جمہوریہ آسٹریا; آسٹریا};{·奥地利共和国;·奥地利}};[·47.33333333;·13.33333333];true;[ CZE; DEU; HUN; ITA; LIE; SVK; SVN; CHE];·83871;;{{ Austrian; Austrian};{ Autrichienne; Autrichien}}↵
{ Azerbaijan; Republic of Azerbaijan;{ aze:{ official: Azərbaycan Respublikası; common: Azərbaycan}; rus:{ official: Азербайджанская Республика; common: Азербайджан}}};[ .az]; AZ;·031; AZE; AZE;true; officially-assigned;true; Eastern European Group;{ AZN:{ name: Azerbaijani manat; symbol:}};{ +9;[·94]};[ Baku];[ AZ; Republic of Azerbaijan; Azərbaycan Respublikası]; Asia; Western Asia;{ aze: Azerbaijani; rus: Russian};{{ جمهورية أذربيجان; أذربيجان};{ Republik Azerbaidjan; Azerbaidjan};{ Ázerbájdžánská republika; Ázerbájdžán};{ Republik Aserbaidschan; Aserbaidschan};{ Aserbaidžaani Vabariik; Aserbaidžaan};{ Azerbaidzanin tasavalta; Azerbaidzan};{ République d'Azerbaïdjan; Azerbaïdjan};{ Republika Azerbajdžan; Azerbajdžan};{ Azerbajdzsán; Azerbajdzsán};{ Repubblica dell'Azerbaigian; Azerbaijan};{·バイジャ共和国;·バイジャ};{;};{ Republiek Azerbeidzjan; Azerbeidzjan};{ جمهوری آذربایجان; جمهوری آذربایجان};{ Republika Azerbejdżanu; Azerbejdżan};{ República do Azerbaijão; Azerbeijão};{ Азербайджанская Республика; Азербайджан};{ Azerbajanská republika; Azerbajan};{ República de Azerbaiyán; Azerbaiyán};{ Republika Azerbejdžan; Azerbejdžan};{ Republiken Azerbajdzjan; Azerbajdzjan};{ Azerbaycan Cumhuriyeti; Azerbaycan};{ جمہوریہ آذربائیجان; آذربائیجان};{·共和国;·}};[·40.5;·47.5];true;[ ARM; GEO; IRN; RUS; TUR];·86600;;{{ Azerbaijani; Azerbaijani};{ Azerbaïdjanaise; Azerbaïdjanais}}↵
{ Burundi; Republic of Burundi;{ fra:{ official: République du Burundi; common: Burundi}; run:{ official: Republika y'Uburundi ; common: Uburundi}}};[ .bi]; BI;·108; BDI; BDI;true; officially-assigned;true; African Group;{ BIF:{ name: Burundian franc; symbol: Fr}};{ +2;[·57]};[ Gitega];[ BI; Republic of Burundi; Republika y'Uburundi; République du Burundi]; Africa; Eastern Africa;{ fra: French; run: Kirundi};{{ جمهورية بوروندي; بوروندي};{ Republik Burundi; Burundi};{ Burundská republika; Burundi};{ Republik Burundi; Burundi};{ Burundi Vabariik; Burundi};{ Burundin tasavalta; Burundi};{ République du Burundi; Burundi};{ Burundi; Burundi};{ Burundi; Burundi};{ Repubblica del Burundi; Burundi};{·ブルンジ共和国;·ブルンジ};{;};{ Republiek Burundi; Burundi};{ جمهوری بوروندی; بوروندی};{ Republika Burundi; Burundi};{ República do Burundi; Burundi};{ Республика Бурунди; Бурунди};{ Burundská republika; Burundi};{ República de Burundi; Burundi};{ Republika Burundi; Burundi};{ Republiken Burundi; Burundi};{ Burundi Cumhuriyeti; Burundi};{ جمہوریہ برونڈی; برونڈی};{·共和国;·}};[ -3.5;·30];true;[ COD; RWA; TZA];·27834;;{{ Burundian; Burundian};{ Burundaise; Burundais}}↵
{ Belgium; Kingdom of Belgium;{ deu:{ official: Königreich Belgien; common: Belgien}; fra:{ official: Royaume de Belgique; common: Belgique}; nld:{ official: Koninkrijk België; common: België}}};[ .be]; BE;·056; BEL; BEL;true; officially-assigned;true; Western European and Others Group;{ EUR:{ name: Euro; symbol:}};{ +3;[·2]};[ Brussels];[ BE; België; Belgie; Belgien; Belgique; Kingdom of Belgium; Koninkrijk België; Royaume de Belgique; Königreich Belgien]; Europe; Western Europe;{ deu: German; fra: French; nld: Dutch};{{ مملكة بلجيكا; بلجيكا};{ Rouantelezh Belgia; Belgia};{ Belgické království; Belgie};{ Königreich Belgien; Belgien};{ Belgia Kuningriik; Belgia};{ Belgian kuningaskunta; Belgia};{ Royaume de Belgique; Belgique};{ Kraljevina Belgija; Belgija};{ Belga Királyság; Belgium};{ Regno del Belgio; Belgio};{·ルギー王国;·ルギー};{기에;기에};{ Koninkrijk België; België};{ پادشاهی بلژیک; بلژیک};{ Klestwo Belgii; Belgia};{ Reino da Bélgica; Bélgica};{ Королевство Бельгия; Бельгия};{ Belgické kľovstvo; Belgicko};{ Reino de Bélgica; Bélgica};{ Kraljevina Belgija; Belgija};{ Konungariket Belgien; Belgien};{ Belçika Krallığı; Belçika};{ مملکتِ بلجئیم; بلجئیم};{·比利时王国;·比利时}};[·50.83333333;·4];false;[ FRA; DEU; LUX; NLD];·30528;;{{ Belgian; Belgian};{ Belge; Belge}}↵
{ Benin; Republic of Benin;{ fra:{ official: République du Bénin; common: Bénin}}};[ .bj]; BJ;·204; BEN; BEN;true; officially-assigned;true; African Group;{ XOF:{ name: West African CFA franc; symbol: Fr}};{ +2;[·29]};[ Porto-Novo];[ BJ; Republic of Benin; République du Bénin]; Africa; Western Africa;{ fra: French};{{ جمهورية بنين; بنين};{ Republik Benin; Benin};{ Benins republika; Benin};{ Republik Benin; Benin};{ Benini Vabariik; Benin};{ Beninin tasavalta; Benin};{ République du Bénin; Bénin};{ Republika Benin; Benin};{ Beniniztársaság; Benin};{ Repubblica del Benin; Benin};{·共和国;·};{;};{ Republiek Benin; Benin};{ جمهوری بنین; بنین};{ Benin; Benin};{ República do Benin; Benin};{ Республика Бенин; Бенин};{ Benins republika; Benin};{ República de Benin; Benín};{ Republika Benin; Benin};{ Republiken Benin; Benin};{ Benin Cumhuriyeti; Benin};{ جمہوریہ بینن; بینن};{·共和国;·}};[·9.5;·2.25];false;[ BFA; NER; NGA; TGO];·112622;;{{ Beninese; Beninese};{ Béninoise; Béninois}}↵
{ Burkina Faso; Burkina Faso;{ fra:{ official: République du Burkina; common: Burkina Faso}}};[ .bf]; BF;·854; BFA; BUR;true; officially-assigned;true; African Group;{ XOF:{ name: West African CFA franc; symbol: Fr}};{ +2;[·26]};[ Ouagadougou];[ BF]; Africa; Western Africa;{ fra: French};{{ بوركينا فاسو; بوركينا فاسو};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ République du Burkina; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina};{ Burkina Faso; Burkina Faso};{·ブルファ;·ブルファ};{;};{ Burkina Faso; Burkina Faso};{ بورکینافاسو; بورکینافاسو};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Буркина -Фасо; Буркина-Фасо};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ Burkina Faso; Burkina Faso};{ برکینا فاسو; برکینا فاسو};{·;·}};[·13; -2];true;[ BEN; CIV; GHA; MLI; NER; TGO];·272967;;{{ Burkinabe; Burkinabe};{ Burkinabée; Burkinabé}}↵
{ Bangladesh; People's Republic of Bangladesh;{ ben:{ official: বাংলাদেশ গণপ্রজাতন্ত্র; common: বাংলাদেশ}}};[ .bd]; BD;·050; BGD; BAN;true; officially-assigned;true; Asia and the Pacific Group;{ BDT:{ name: Bangladeshi taka; symbol:·}};{ +8;[·80]};[ Dhaka];[ BD; People's Republic of Bangladesh; Gônôprôjatôntri Bangladesh]; Asia; Southern Asia;{ ben: Bengali};{{ جمهورية بنغلاديش الشعبية; بنغلاديش};{ Republik pobl Bangladesh; Bangladesh};{ Bangladéšská lidová republika; Bangladéš};{ Volksrepublik Bangladesch; Bangladesch};{ Bangladeshi Rahvavabariik; Bangladesh};{ Bangladeshin kansantasavalta; Bangladesh};{ La République populaire du Bangladesh; Bangladesh};{ Narodna Republika Bangladeš; Bangladeš};{ Banglades; Banglades};{ Repubblica popolare del Bangladesh; Bangladesh};{·ングシュ人民共和国;·ングシュ};{;};{ Volksrepubliek Bangladesh; Bangladesh};{ جمهوری خلق بنگلادش; بنگلادش};{ Ludowa Republika Bangladeszu; Bangladesz};{ República Popular do Bangladesh; Bangladesh};{ Народная Республика Бангладеш; Бангладеш};{ Bangladéšskaudová republika; Bangladéš};{ República Popular de Bangladesh; Bangladesh};{ Narodna Republika Bangladeš; Bangladeš};{ Folkrepubliken Bangladesh; Bangladesh};{ Bangladeş Halk Cumhuriyeti; Bangladeş};{ عوامی جمہوریہ بنگلہ دیش; بنگلہ دیش};{·加拉人民共和国;·加拉}};[·24;·90];false;[ MMR; IND];·147570;;{{ Bangladeshi; Bangladeshi};{ Bangladaise; Bangladais}}↵
{ Bulgaria; Republic of Bulgaria;{ bul:{ official: Република България; common: България}}};[ .bg]; BG;·100; BGR; BUL;true; officially-assigned;true; Eastern European Group;{ BGN:{ name: Bulgarian lev; symbol: лв}};{ +3;[·59]};[ Sofia];[ BG; Republic of Bulgaria; Република България]; Europe; Southeast Europe;{ bul: Bulgarian};{{ جمهورية بلغاريا; بلغاريا};{ Republik Bulgaria; Bulgaria};{ Bulhars republika; Bulharsko};{ Republik Bulgarien; Bulgarien};{ Bulgaaria Vabariik; Bulgaaria};{ Bulgarian tasavalta; Bulgaria};{ République de Bulgarie; Bulgarie};{ Republika Bugarska; Bugarska};{ Bolgárztársaság; Bulgária};{ Repubblica di Bulgaria; Bulgaria};{·ブルリア共和国;·ブルリア};{리아;리아};{ Republiek Bulgarije; Bulgarije};{ جمهوری بلغارستان; بلغارستان};{ Republika Bułgarii; Bułgaria};{ República da Bulgária; Bulgária};{ Республика Болгария; Болгария};{ Bulhars republika; Bulharsko};{ República de Bulgaria; Bulgaria};{ Republika Bugarska; Bugarska};{ Republiken Bulgarien; Bulgarien};{ Bulgaristan Cumhuriyeti; Bulgaristan};{ جمہوریہ بلغاریہ; بلغاریہ};{·利亚共和国;·利亚}};[·43;·25];false;[ GRC; MKD; ROU; SRB; TUR];·110879;;{{ Bulgarian; Bulgarian};{ Bulgare; Bulgare}}↵
{ Bahrain; Kingdom of Bahrain;{ ara:{ official: مملكة البحرين; common: البحرين}}};[ .bh]; BH;·048; BHR; BRN;true; officially-assigned;true; Asia and the Pacific Group;{ BHD:{ name: Bahraini dinar; symbol: .د.ب}};{ +9;[·73]};[ Manama];[ BH; Kingdom of Bahrain; Mamlakat al-Barayn]; Asia; Western Asia;{ ara: Arabic};{{ مملكة البحرين; البحرين};{ Rouantelezh Bahrein; Bahrein};{ Království Bahrajn; Bahrajn};{ Königreich Bahrain; Bahrain};{ Bahreini Kuningriik; Bahrein};{ Bahrainin kuningaskunta; Bahrain};{ Royaume de Bahreïn; Bahreïn};{ Kraljevina Bahrein; Bahrein};{ Bahreini Királyság; Bahrein};{ Regno del Bahrain; Bahrein};{·ー�ーン王国;·ー�ーン};{;};{ Koninkrijk Bahrein; Bahrein};{ پادشاهی بحرین; بحرین};{ Klestwo Bahrajnu; Bahrajn};{ Reino do Bahrein; Bahrein};{ Королевство Бахрейн; Бахрейн};{ Bahrajnské kľovstvo; Bahrajn};{ Reino de Bahrein; Bahrein};{ Kraljevina Bahrein; Bahrein};{ Konungariket Bahrain; Bahrain};{ Bahreyn Krallığı; Bahreyn};{ مملکتِ بحرین; بحرین};{·王国;·}};[·26;·50.55];false;[];·765;;{{ Bahraini; Bahraini};{ Bahreïnienne; Bahreïnien}}
... (truncated)
minemizer (compact)
chars: 299,485 tokens: 124,200 chars_og/tok: 9.1 enc_chars/tok: 2.4
<|begin▁of▁sentence|>name{common;official;native{...}};tld[];cca2;ccn3;cca3;cioc;independent;status;unMember;unRegionalGroup;currencies{...};idd{root;suffixes[]};capital[];altSpellings[];region;subregion;languages{...};translations{ara{official;common};bre{official;common};ces{official;common};deu{official;common};est{official;common};fin{official;common};fra{official;common};hrv{official;common};hun{official;common};ita{official;common};jpn{official;common};kor{official;common};nld{official;common};per{official;common};pol{official;common};por{official;common};rus{official;common};slk{official;common};spa{official;common};srp{official;common};swe{official;common};tur{official;common};urd{official;common};zho{official;common}};latlng[];landlocked;borders[];area;flag;demonyms{eng{f;m};fra{f;m}}↵
{Aruba;Aruba;{nld:{official:Aruba;common:Aruba};pap:{official:Aruba;common:Aruba}}};[.aw];AW;533;ABW;ARU;false;officially-assigned;false;;{AWG:{name:Aruban florin;symbol:ƒ}};{+2;[97]};[Oranjestad];[AW];Americas;Caribbean;{nld:Dutch;pap:Papiamento};{{أروبا;أروبا};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{アル;アル};{;};{Aruba;Aruba};{آروبا;آروبا};{Aruba;Aruba};{Aruba;Aruba};{Аруба;Аруба};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{Aruba;Aruba};{اروبا;اروبا};{;}};[12.5;-69.96666666];false;[];180;;{{Aruban;Aruban};{Arubaise;Arubais}}↵
{Afghanistan;Islamic Republic of Afghanistan;{prs:{official:جمهوری اسلامی افغانستان;common:افغانستان};pus:{official:د افغانستان اسلامي جمهوریت;common:افغانستان};tuk:{official:Owganystan Yslam Respublikasy;common:Owganystan}}};[.af];AF;004;AFG;AFG;true;officially-assigned;true;Asia and the Pacific Group;{AFN:{name:Afghan afghani;symbol:}};{+9;[3]};[Kabul];[AF;Afānistān];Asia;Southern Asia;{prs:Dari;pus:Pashto;tuk:Turkmen};{{جمهورية أففانستان الإسلامية;أفغانستان};{Republik Islamek Afghanistan;Afghanistan};{Afghánská isms republika;Afghánistán};{Islamische Republik Afghanistan;Afghanistan};{Afganistani Islamivabariik;Afganistan};{Afganistanin islamilainen tasavalta;Afganistan};{République islamique d'Afghanistan;Afghanistan};{Islamska Republika Afganistan;Afganistan};{Afganisztáni Iszlámztársaság;Afganisztán};{Repubblica islamica dell'Afghanistan;Afghanistan};{スタ共和国;スタ};{;};{Islamitische Republiek Afghanistan;Afghanistan};{جمهوری اسلامی افغانستان;افغانستان};{Islamska Republika Afganistanu;Afganistan};{República Islâmica do Afeganistão;Afeganistão};{Исламская Республика Афганистан;Афганистан};{Afgánsky islamský štát;Afganistan};{República Islámica de Afganistán;Afganistán};{Islamska Republika Avganistan;Avganistan};{Islamiska republiken Afghanistan;Afghanistan};{Afganistan İslam Cumhuriyeti;Afganistan};{اسلامی جمہوریہ افغانستان;افغانستان};{阿富汗伊斯兰共和国;阿富汗}};[33;65];true;[IRN;PAK;TKM;UZB;TJK;CHN];652230;;{{Afghan;Afghan};{Afghane;Afghan}}↵
{Angola;Republic of Angola;{por:{official:República de Angola;common:Angola}}};[.ao];AO;024;AGO;ANG;true;officially-assigned;true;African Group;{AOA:{name:Angolan kwanza;symbol:Kz}};{+2;[44]};[Luanda];[AO;República de Angola;ʁɛpublika de an'ɡɔla];Africa;Middle Africa;{por:Portuguese};{{أنغولا;جمهورية أنغولا};{Republik Angola;Angola};{Angolská republika;Angola};{Republik Angola;Angola};{Angola Vabariik;Angola};{Angolan tasavalta;Angola};{République d'Angola;Angola};{Republika Angola;Angola};{Angola;Angola};{Repubblica dell'Angola;Angola};{共和国;};{;};{Republiek Angola;Angola};{جمهوری آنگولا;آنگولا};{Republika Angoli;Angola};{República de Angola;Angola};{Республика Ангола;Ангола};{Angolská republika;Angola};{República de Angola;Angola};{Republika Angola;Angola};{Republiken Angola;Angola};{Angola Cumhuriyeti;Angola};{جمہوریہ انگولہ;انگولہ};{共和国;}};[-12.5;18.5];false;[COG;COD;ZMB;NAM];1246700;;{{Angolan;Angolan};{Angolaise;Angolais}}↵
{Anguilla;Anguilla;{eng:{official:Anguilla;common:Anguilla}}};[.ai];AI;660;AIA;;false;officially-assigned;false;;{XCD:{name:Eastern Caribbean dollar;symbol:$}};{+1;[264]};[The Valley];[AI];Americas;Caribbean;{eng:English};{{أنغويلا;أنغويلا};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Anguilla};{Anguilla;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{;};{;};{Anguilla;Anguilla};{آنگویلا;آنگویلا};{Anguilla;Anguilla};{Anguilla;Anguilla};{Ангилья;Ангилья};{Anguilla;Anguilla};{Anguila;Anguilla};{Angvila;Angvila};{Anguilla;Anguilla};{Anguilla;Anguilla};{اینگویلا;اینگویلا};{;}};[18.25;-63.16666666];false;[];91;;{{Anguillian;Anguillian};{Anguillane;Anguillan}}↵
{Åland Islands;Åland Islands;{swe:{official:Landskapet Åland;common:Åland}}};[.ax];AX;248;ALA;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+3;[5818]};[Mariehamn];[AX;Aaland;Aland;Ahvenanmaa];Europe;Northern Europe;{swe:Swedish};{{جزر أولاند;جزر أولاند};{Inizi Åland;Åland};{Ålandské ostrovy;Ålandy};{Åland-Inseln;Åland};{Ahvenamaa maakond;Ahvenamaa};{Ahvenanmaan maakunta;Ahvenanmaa};{Ahvenanmaa;Ahvenanmaa};{Aland Islands;Ålandski otoci};{Åland-szigetek;Åland-szigetek};{Isole Åland;Isole Aland};{ンド;ンド};{;};{Åland eilanden;Ålandeilanden};{جزایر الند;جزایر الند};{Wyspy Alandzkie;Wyspy Alandzkie};{Ilhas Åland;Alândia};{Аландские острова;Аландские острова};{Alandské ostrovy;Alandy};{Islas Åland;Alandia};{Olandska Ostrva;Olandska Ostrva};{Åland;Åland};{Åland Adaları;Åland};{جزائر اولند;جزائر اولند};{群岛;群岛}};[60.116667;19.9];false;[];1580;;{{Ålandish;Ålandish};{Ålandaise;Ålandais}}↵
{Albania;Republic of Albania;{sqi:{official:Republika e Shqipërisë;common:Shqipëria}}};[.al];AL;008;ALB;ALB;true;officially-assigned;true;Eastern European Group;{ALL:{name:Albanian lek;symbol:L}};{+3;[55]};[Tirana];[AL;Shqipëri;Shqipëria;Shqipnia];Europe;Southeast Europe;{sqi:Albanian};{{جمهورية ألبانيا;ألبانيا};{Republik Albania;Albania};{Albánská republika;Albánie};{Republik Albanien;Albanien};{Albaania Vabariik;Albaania};{Albanian tasavalta;Albania};{République d'Albanie;Albanie};{Republika Albanija;Albanija};{Albánztársaság;Albánia};{Repubblica d'Albania;Albania};{アルニア共和国;アルニア};{;};{Republiek Alban;Albanië};{جمهوری آلبانی;آلبانی};{Republika Albanii;Albania};{República da Albânia;Albânia};{Республика Албания;Албания};{Albánska republika;Albánsko};{República de Albania;Albania};{Republika Albanija;Albanija};{Republiken Albanien;Albanien};{Arnavutluk Cumhuriyeti;Arnavutluk};{جمہوریہ البانیا;البانیا};{阿尔尼亚共和国;阿尔尼亚}};[41;20];false;[MNE;GRC;MKD;UNK];28748;;{{Albanian;Albanian};{Albanaise;Albanais}}↵
{Andorra;Principality of Andorra;{cat:{official:Principat d'Andorra;common:Andorra}}};[.ad];AD;020;AND;AND;true;officially-assigned;true;Western European and Others Group;{EUR:{name:Euro;symbol:}};{+3;[76]};[Andorra la Vella];[AD;Principality of Andorra;Principat d'Andorra];Europe;Southern Europe;{cat:Catalan};{{إمارة أندورا;أندورا};{Priñselezh Andorra;Andorra};{Andorrské kžect;Andorra};{Fürstentum Andorra;Andorra};{Andorra Vürstiriik;Andorra};{Andorran ruhtinaskunta;Andorra};{Principauté d'Andorre;Andorre};{Kneževina Andora;Andora};{Andorra;Andorra};{Principato di Andorra;Andorra};{ンド;ンド};{;};{Prinsdom Andorra;Andorra};{شاهزادهنشین آندورا;آندورا};{Księstwo Andory;Andora};{Principado de Andorra;Andorra};{Княжество Андорра;Андорра};{Andorrské kniežatstvo;Andorra};{Principado de Andorra;Andorra};{Kneževina Andora;Andora};{Furstendömet Andorra;Andorra};{Andorra Prensliği;Andorra};{اماراتِ انڈورا;انڈورا};{;}};[42.5;1.5];true;[FRA;ESP];468;;{{Andorran;Andorran};{Andorrane;Andorran}}↵
{United Arab Emirates;United Arab Emirates;{ara:{official:الإمارات العربية المتحدة;common:الإمارات}}};[.ae;امارات.];AE;784;ARE;UAE;true;officially-assigned;true;Asia and the Pacific Group;{AED:{name:United Arab Emirates dirham;symbol:د.إ}};{+9;[71]};[Abu Dhabi];[AE;UAE;Emirates];Asia;Western Asia;{ara:Arabic};{{الإمارات العربية المتحدة;الإمارات};{Emirelezhioù Arab Unanet;Emirelezhioù Arab Unanet};{Spojené arabs emiráty;Spojené arabs emiráty};{Vereinigte Arabische Emirate;Vereinigte Arabische Emirate};{Araabia Ühendemiraadid;Araabia Ühendemiraadid};{Yhdistyneet arabiemiirikunnat;Arabiemiraatit};{Émirats arabes unis;Émirats arabes unis};{Ujedinjeni Arapski Emirati;Ujedinjeni Arapski Emirati};{Egyesült Arab Emírségek;Egyesült Arab Emírségek};{Emirati Arabi Uniti;Emirati Arabi Uniti};{;UAE};{;};{Verenigde Arabische Emiraten;Verenigde Arabische Emiraten};{امارات متحده عربی;امارات};{Zjednoczone Emiraty Arabskie;Zjednoczone Emiraty Arabskie};{Emirados Árabes Unidos;Emirados Árabes Unidos};{Объединенные Арабские Эмираты;Объединённые Арабские Эмираты};{Spojené arabs emiráty;Spojené arabs emiráty};{Emiratos Árabes Unidos;Emiratos Árabes Unidos};{Ujedinjeni Arapski Emirati;Ujedinjeni Arapski Emirati};{Förenade Arabemiraten;Förenade Arabemiraten};{Birleşik Arap Emirlikleri;Birleşik Arap Emirlikleri};{متحدہ عرب امارات;متحدہ عرب امارات};{阿拉伯联合;阿拉伯联合}};[24;54];false;[OMN;SAU];83600;;{{Emirati;Emirati};{Emirienne;Emirien}}↵
{Argentina;Argentine Republic;{grn:{official:Argentine Republic;common:Argentina};spa:{official:República Argentina;common:Argentina}}};[.ar];AR;032;ARG;ARG;true;officially-assigned;true;Latin American and Caribbean Group;{ARS:{name:Argentine peso;symbol:$}};{+5;[4]};[Buenos Aires];[AR;Argentine Republic;República Argentina];Americas;South America;{grn:Guaraní;spa:Spanish};{{جمهورية الأرجنتين;الأرجنتين};{Republik Arc'hantina;Arc'hantina};{Argentins republika;Argentina};{Argentinische Republik;Argentinien};{Argentina Vabariik;Argentina};{Argentiinan tasavalta;Argentiina};{République argentine;Argentine};{Argentinski Republika;Argentina};{Argentinztársaság;Argentína};{Repubblica Argentina;Argentina};{アルンチ共和国;アルンチ};{;};{Argentijnse Republiek;Argentinië};{جمهوری آرژانتین;آرژانتین};{Republika Argentyńska;Argentyna};{República Argentina;Argentina};{Аргентинская Республика;Аргентина};{Argentínska republika;Argentína};{República Argentina;Argentina};{Republika Argentina;Argentina};{Republiken Argentina;Argentina};{Arjantin Cumhuriyeti;Arjantin};{جمہوریہ ارجنٹائن;ارجنٹائن};{阿根廷共和国;阿根廷}};[-34;-64];false;[BOL;BRA;CHL;PRY;URY];2780400;;{{Argentine;Argentine};{Argentine;Argentin}}↵
{Armenia;Republic of Armenia;{hye:{official:Հայաստանի Հանրապետություն;common:Հայաստան}}};[.am];AM;051;ARM;ARM;true;officially-assigned;true;Eastern European Group;{AMD:{name:Armenian dram;symbol:}};{+3;[74]};[Yerevan];[AM;Hayastan;Republic of Armenia;Հայաստանի Հանրապետություն];Asia;Western Asia;{hye:Armenian};{{جمهورية أرمينيا;أرمينيا};{Republik Armenia;Armenia};{Arménská republika;Arménie};{Republik Armenien;Armenien};{Armeenia Vabariik;Armeenia};{Armenian tasavalta;Armenia};{République d'Arménie;Arménie};{Republika Armenija;Armenija};{Örményország;Örményország};{Repubblica di Armenia;Armenia};{アルニア共和国;アルニア};{;};{Republiek Armen;Armenië};{جمهوری ارمنستان;ارمنستان};{Republika Armenii;Armenia};{República da Arménia;Arménia};{Республика Армения;Армения};{Arménska republika;Arménsko};{República de Armenia;Armenia};{Republika Jermenija;Jermenija};{Republiken Armenien;Armenien};{Ermenistan Cumhuriyeti;Ermenistan};{جمہوریہ آرمینیا;آرمینیا};{尼亚共和国;尼亚}};[40;45];true;[AZE;GEO;IRN;TUR];29743;;{{Armenian;Armenian};{Arménienne;Arménien}}↵
{American Samoa;American Samoa;{eng:{official:American Samoa;common:American Samoa};smo:{official:Sāmoa Amelika;common:Sāmoa Amelika}}};[.as];AS;016;ASM;ASA;false;officially-assigned;false;;{USD:{name:United States dollar;symbol:$}};{+1;[684]};[Pago Pago];[AS;Amerika Sāmoa;Amelika Sāmoa;Sāmoa Amelika];Oceania;Polynesia;{eng:English;smo:Samoan};{{ساموا الأمريكية;ساموا الأمريكية};{Samoa Amerikan;Samoa Amerikan};{Americká Samoa;Americká Samoa};{Amerikanisch-Samoa;Amerikanisch-Samoa};{Ameerika Samoa;Ameerika Samoa};{Amerikan Samoa;Amerikan Samoa};{Samoa américaines;Samoa américaines};{amerka Samoa;Američka Samoa};{Szamoa;Szamoa};{Samoa americane;Samoa Americane};{;アメリカ};{;};{Amerikaans Samoa;Amerikaans Samoa};{ساموآی آمریکا;ساموآی آمریکا};{Samoa Amerykańskie;Samoa Amerykańskie};{Samoa americana;Samoa Americana};{американское Самоа;Американское Самоа};{Americká Samoa;Americká Samoa};{Samoa Americana;Samoa Americana};{Amerka Samoa;Američka Samoa};{Amerikanska Samoa;Amerikanska Samoa};{Amerikan Samoası;Amerikan Samoası};{امریکی سمووا;امریکی سمووا};{;}};[-14.33333333;-170];false;[];199;;{{American Samoan;American Samoan};{Samoane;Samoan}}↵
{Antarctica;Antarctica;{}};[.aq];AQ;010;ATA;;false;officially-assigned;false;;{};{;[]};[];[AQ];Antarctic;;{};{{أنتارتيكا;أنتارتيكا};{Antarktika;Antarktika};{Antarktida;Antarktida};{Antarktika;Antarktis};{Antarktika;Antarktika};{Etelämanner;Etelämanner};{Antarctique;Antarctique};{Antarktika;Antarktika};{Antarktisz;Antarktisz};{Antartide;Antartide};{;大陸};{;};{Antarctica;Antarctica};{جنوبگان;جنوبگان};{Antarktyka;Antarktyka};{Antártica;Antártida};{Антарктида;Антарктида};{Antarktída;Antarktída};{Antártida;Antártida};{Antarktik;Antarktik};{Antarktis;Antarktis};{Antarktika;Antarktika};{انٹارکٹکا;انٹارکٹکا};{南极;南极}};[-90;0];false;[];14000000;;{{Antarctican;Antarctican};{Antarcticaine;Antarcticain}}↵
{French Southern and Antarctic Lands;Territory of the French Southern and Antarctic Lands;{fra:{official:Territoire des Terres australes et antarctiques françaises;common:Terres australes et antarctiques françaises}}};[.tf];TF;260;ATF;;false;officially-assigned;false;;{EUR:{name:Euro;symbol:}};{+2;[62]};[Port-aux-Français];[TF;French Southern Territories];Antarctic;;{fra:French};{{مقاطعات وأقاليم ما وراء البحار الفرنسية;أراض فرنسية جنوبية وأنتارتيكية};{Tiriad Douaroù Aostral hag Antarktikel Frañs;Douaroù Aostral hag Antarktikel Frañs};{Teritorium Francouzská již a antarktická území;Francouzská již a antarktická území};{Gebiet der Französisch Süd- und Antarktisgebiete;Französische Süd- und Antarktisgebiete};{Prantsuse Lõunaalad;Prantsuse Lõunaalad};{Ranskan eteläiset ja antarktiset alueet;Ranskan eteläiset ja antarktiset alueet};{Territoire des Terres australes et antarctiques françaises;Terres australes et antarctiques françaises};{Teritoriju Francuski južni i antarktički teritoriji;Francuski južni i antarktički teritoriji};{Franciali és antarktiszi területek;Franciali és antarktiszi területek};{Territorio della australi e antartiche francesi Terre;Territori Francesi del Sud};{ランス;ランス南方地域};{ 지역; 지역};{Grondgebied van de Franse Zuidelijke en Antarctische gebieden;Franse Gebieden in de zuidelijke Indische Oceaan};{سرزمینهای جنوبی و جنوبگانی فرانسه;سرزمینهای جنوبی و جنوبگانی فرانسه};{Francuskie Terytoria Południowe i Antarktyczne;Francuskie Terytoria Południowe i Antarktyczne};{Território do Sul e Antártica Francesa;Terras Austrais e Antárticas Francesas};{Территория Французские Южные и Антарктические земли;Французские Южные и Антарктические территории};{Francúzske juž a antarktické územia;Francúzske juŽ a antarktické územia};{Territorio del Francés Tierras australes y antárticas;Tierras Australes y Antárticas Francesas};{Francuske južne i antarktičke zemlje;Francuske južne i antarktičke zemlje};{Franska syd- och Antarktisterritorierna;Franska södra 
territorierna};{Fransızney ve Antarktika Toprakları;Fransızney ve Antarktika Toprakları};{سرزمینِ جنوبی فرانسیسیہ و انٹارکٹیکہ;سرزمین جنوبی فرانسیسیہ و انٹارکٹیکا};{法国南部南极土地;法国南部南极土地}};[-49.25;69.167];false;[];7747;;{{French;French};{Française;Français}}↵
{Antigua and Barbuda;Antigua and Barbuda;{eng:{official:Antigua and Barbuda;common:Antigua and Barbuda}}};[.ag];AG;028;ATG;ANT;true;officially-assigned;true;Latin American and Caribbean Group;{XCD:{name:Eastern Caribbean dollar;symbol:$}};{+1;[268]};[Saint John's];[AG];Americas;Caribbean;{eng:English};{{أنتيغوا وباربودا;أنتيغوا وباربودا};{Antigua ha Barbuda;Antigua ha Barbuda};{Antigua a Barbuda;Antigua a Barbuda};{Antigua und Barbuda;Antigua und Barbuda};{Antigua ja Barbuda;Antigua ja Barbuda};{Antigua ja Barbuda;Antigua ja Barbuda};{Antigua -et-Barbuda;Antigua-et-Barbuda};{Antigva i Barbuda;Antigva i Barbuda};{Antigua és Barbuda;Antigua és Barbuda};{Antigua e Barbuda;Antigua e Barbuda};{ン��ィーブー�;ン��ィーブー�};{;};{Antigua en Barbuda;Antigua en Barbuda};{آنتیگوا و باربودا;آنتیگوا و باربودا};{Antigua i Barbuda;Antigua i Barbuda};{Antigua e Barbuda;Antígua e Barbuda};{Антигуа и Барбуда;Антигуа и Барбуда};{Antigua a Barbuda;Antigua a Barbuda};{Antigua y Barbuda;Antigua y Barbuda};{Antigva i Barbuda;Antigva i Barbuda};{Antigua och Barbuda;Antigua och Barbuda};{Antigua ve Barbuda;Antigua ve Barbuda};{اینٹیگوا و باربوڈا;اینٹیگوا و باربوڈا};{;}};[17.05;-61.8];false;[];442;;{{Antiguan, Barbudan;Antiguan, Barbudan};{Antiguaise et barbudienne;Antiguaise et barbudien}}↵
{Australia;Commonwealth of Australia;{eng:{official:Commonwealth of Australia;common:Australia}}};[.au];AU;036;AUS;AUS;true;officially-assigned;true;Western European and Others Group;{AUD:{name:Australian dollar;symbol:$}};{+6;[1]};[Canberra];[AU];Oceania;Australia and New Zealand;{eng:English};{{كومونولث أستراليا;أستراليا};{Kenglad Aostralia;Aostralia};{Australs společenství;Austrálie};{Commonwealth Australien;Australien};{Austraalia Ühendus;Austraalia};{Australian liittovaltio;Australia};{Australie;Australie};{Commonwealth of Australia;Australija};{Ausztrál Államszövetség;Ausztrália};{Commonwealth dell'Australia;Australia};{ストリア;ストリア};{스트리아;};{Gemenebest van Austral;Australië};{قلمرو همسود استرالیا;استرالیا};{Związek Australijski;Australia};{Comunidade da Austrália;Austrália};{Содружество Австралии;Австралия};{Austrálsky zz;Austrália};{Mancomunidad de Australia;Australia};{Komonvelt Australija;Australija};{Australiska statsförbundet;Australien};{Avustralya Federal Devleti;Avustralya};{دولتِ مشترکہ آسٹریلیا;آسٹریلیا};{澳大利亚联邦;澳大利亚}};[-27;133];false;[];7692024;;{{Australian;Australian};{Australienne;Australien}}↵
{Austria;Republic of Austria;{bar:{official:Republik Österreich;common:Österreich}}};[.at];AT;040;AUT;AUT;true;officially-assigned;true;Western European and Others Group;{EUR:{name:Euro;symbol:}};{+4;[3]};[Vienna];[AT;Osterreich;Oesterreich];Europe;Central Europe;{bar:Austro-Bavarian German};{{جمهورية النمسا;النمسا};{Republik Aostria;Aostria};{Rakous republika;Rakousko};{Republik Österreich;Österreich};{Austria Vabariik;Austria};{Itävallan tasavalta;Itävalta};{République d'Autriche;Autriche};{Republika Austrija;Austrija};{Ausztria;Ausztria};{Repubblica d'Austria;Austria};{ストリア共和国;ストリア};{스트리아;스트리아};{Republiek Oostenrijk;Oostenrijk};{جمهوری اتریش;اتریش};{Republika Austrii;Austria};{República da Áustria;Áustria};{Австрийская Республика;Австрия};{Rakúska republika;Rakúsko};{República de Austria;Austria};{Republika Austrija;Austrija};{Republiken Österrike;Österrike};{Avusturya Cumhuriyeti;Avusturya};{جمہوریہ آسٹریا;آسٹریا};{奥地利共和国;奥地利}};[47.33333333;13.33333333];true;[CZE;DEU;HUN;ITA;LIE;SVK;SVN;CHE];83871;;{{Austrian;Austrian};{Autrichienne;Autrichien}}↵
{Azerbaijan;Republic of Azerbaijan;{aze:{official:Azərbaycan Respublikası;common:Azərbaycan};rus:{official:Азербайджанская Республика;common:Азербайджан}}};[.az];AZ;031;AZE;AZE;true;officially-assigned;true;Eastern European Group;{AZN:{name:Azerbaijani manat;symbol:}};{+9;[94]};[Baku];[AZ;Republic of Azerbaijan;Azərbaycan Respublikası];Asia;Western Asia;{aze:Azerbaijani;rus:Russian};{{جمهورية أذربيجان;أذربيجان};{Republik Azerbaidjan;Azerbaidjan};{Ázerbájdžánská republika;Ázerbájdžán};{Republik Aserbaidschan;Aserbaidschan};{Aserbaidžaani Vabariik;Aserbaidžaan};{Azerbaidzanin tasavalta;Azerbaidzan};{République d'Azerbaïdjan;Azerbaïdjan};{Republika Azerbajdžan;Azerbajdžan};{Azerbajdzsán;Azerbajdzsán};{Repubblica dell'Azerbaigian;Azerbaijan};{バイジャ共和国;バイジャ};{;};{Republiek Azerbeidzjan;Azerbeidzjan};{جمهوری آذربایجان;جمهوری آذربایجان};{Republika Azerbejdżanu;Azerbejdżan};{República do Azerbaijão;Azerbeijão};{Азербайджанская Республика;Азербайджан};{Azerbajanská republika;Azerbajan};{República de Azerbaiyán;Azerbaiyán};{Republika Azerbejdžan;Azerbejdžan};{Republiken Azerbajdzjan;Azerbajdzjan};{Azerbaycan Cumhuriyeti;Azerbaycan};{جمہوریہ آذربائیجان;آذربائیجان};{共和国;}};[40.5;47.5];true;[ARM;GEO;IRN;RUS;TUR];86600;;{{Azerbaijani;Azerbaijani};{Azerbaïdjanaise;Azerbaïdjanais}}↵
{Burundi;Republic of Burundi;{fra:{official:République du Burundi;common:Burundi};run:{official:Republika y'Uburundi ;common:Uburundi}}};[.bi];BI;108;BDI;BDI;true;officially-assigned;true;African Group;{BIF:{name:Burundian franc;symbol:Fr}};{+2;[57]};[Gitega];[BI;Republic of Burundi;Republika y'Uburundi;République du Burundi];Africa;Eastern Africa;{fra:French;run:Kirundi};{{جمهورية بوروندي;بوروندي};{Republik Burundi;Burundi};{Burundská republika;Burundi};{Republik Burundi;Burundi};{Burundi Vabariik;Burundi};{Burundin tasavalta;Burundi};{République du Burundi;Burundi};{Burundi;Burundi};{Burundi;Burundi};{Repubblica del Burundi;Burundi};{ブルンジ共和国;ブルンジ};{;};{Republiek Burundi;Burundi};{جمهوری بوروندی;بوروندی};{Republika Burundi;Burundi};{República do Burundi;Burundi};{Республика Бурунди;Бурунди};{Burundská republika;Burundi};{República de Burundi;Burundi};{Republika Burundi;Burundi};{Republiken Burundi;Burundi};{Burundi Cumhuriyeti;Burundi};{جمہوریہ برونڈی;برونڈی};{共和国;}};[-3.5;30];true;[COD;RWA;TZA];27834;;{{Burundian;Burundian};{Burundaise;Burundais}}↵
{Belgium;Kingdom of Belgium;{deu:{official:Königreich Belgien;common:Belgien};fra:{official:Royaume de Belgique;common:Belgique};nld:{official:Koninkrijk België;common:België}}};[.be];BE;056;BEL;BEL;true;officially-assigned;true;Western European and Others Group;{EUR:{name:Euro;symbol:}};{+3;[2]};[Brussels];[BE;België;Belgie;Belgien;Belgique;Kingdom of Belgium;Koninkrijk België;Royaume de Belgique;Königreich Belgien];Europe;Western Europe;{deu:German;fra:French;nld:Dutch};{{مملكة بلجيكا;بلجيكا};{Rouantelezh Belgia;Belgia};{Belgické království;Belgie};{Königreich Belgien;Belgien};{Belgia Kuningriik;Belgia};{Belgian kuningaskunta;Belgia};{Royaume de Belgique;Belgique};{Kraljevina Belgija;Belgija};{Belga Királyság;Belgium};{Regno del Belgio;Belgio};{ルギー王国;ルギー};{기에;기에};{Koninkrijk België;België};{پادشاهی بلژیک;بلژیک};{Klestwo Belgii;Belgia};{Reino da Bélgica;Bélgica};{Королевство Бельгия;Бельгия};{Belgické kľovstvo;Belgicko};{Reino de Bélgica;Bélgica};{Kraljevina Belgija;Belgija};{Konungariket Belgien;Belgien};{Belçika Krallığı;Belçika};{مملکتِ بلجئیم;بلجئیم};{比利时王国;比利时}};[50.83333333;4];false;[FRA;DEU;LUX;NLD];30528;;{{Belgian;Belgian};{Belge;Belge}}↵
{Benin;Republic of Benin;{fra:{official:République du Bénin;common:Bénin}}};[.bj];BJ;204;BEN;BEN;true;officially-assigned;true;African Group;{XOF:{name:West African CFA franc;symbol:Fr}};{+2;[29]};[Porto-Novo];[BJ;Republic of Benin;République du Bénin];Africa;Western Africa;{fra:French};{{جمهورية بنين;بنين};{Republik Benin;Benin};{Benins republika;Benin};{Republik Benin;Benin};{Benini Vabariik;Benin};{Beninin tasavalta;Benin};{République du Bénin;Bénin};{Republika Benin;Benin};{Beniniztársaság;Benin};{Repubblica del Benin;Benin};{共和国;};{;};{Republiek Benin;Benin};{جمهوری بنین;بنین};{Benin;Benin};{República do Benin;Benin};{Республика Бенин;Бенин};{Benins republika;Benin};{República de Benin;Benín};{Republika Benin;Benin};{Republiken Benin;Benin};{Benin Cumhuriyeti;Benin};{جمہوریہ بینن;بینن};{共和国;}};[9.5;2.25];false;[BFA;NER;NGA;TGO];112622;;{{Beninese;Beninese};{Béninoise;Béninois}}↵
{Burkina Faso;Burkina Faso;{fra:{official:République du Burkina;common:Burkina Faso}}};[.bf];BF;854;BFA;BUR;true;officially-assigned;true;African Group;{XOF:{name:West African CFA franc;symbol:Fr}};{+2;[26]};[Ouagadougou];[BF];Africa;Western Africa;{fra:French};{{بوركينا فاسو;بوركينا فاسو};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{République du Burkina;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina};{Burkina Faso;Burkina Faso};{ブルファ;ブルファ};{;};{Burkina Faso;Burkina Faso};{بورکینافاسو;بورکینافاسو};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Буркина -Фасо;Буркина-Фасо};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{Burkina Faso;Burkina Faso};{برکینا فاسو;برکینا فاسو};{;}};[13;-2];true;[BEN;CIV;GHA;MLI;NER;TGO];272967;;{{Burkinabe;Burkinabe};{Burkinabée;Burkinabé}}↵
{Bangladesh;People's Republic of Bangladesh;{ben:{official:াংলাদেশ গণপ্রজাতন্ত্র;common:াংলাদেশ}}};[.bd];BD;050;BGD;BAN;true;officially-assigned;true;Asia and the Pacific Group;{BDT:{name:Bangladeshi taka;symbol:}};{+8;[80]};[Dhaka];[BD;People's Republic of Bangladesh;Gônôprôjatôntri Bangladesh];Asia;Southern Asia;{ben:Bengali};{{جمهورية بنغلاديش الشعبية;بنغلاديش};{Republik pobl Bangladesh;Bangladesh};{Bangladéšská lidová republika;Bangladéš};{Volksrepublik Bangladesch;Bangladesch};{Bangladeshi Rahvavabariik;Bangladesh};{Bangladeshin kansantasavalta;Bangladesh};{La République populaire du Bangladesh;Bangladesh};{Narodna Republika Bangladeš;Bangladeš};{Banglades;Banglades};{Repubblica popolare del Bangladesh;Bangladesh};{ングシュ人民共和国;ングシュ};{;};{Volksrepubliek Bangladesh;Bangladesh};{جمهوری خلق بنگلادش;بنگلادش};{Ludowa Republika Bangladeszu;Bangladesz};{República Popular do Bangladesh;Bangladesh};{Народная Республика Бангладеш;Бангладеш};{Bangladéšskaudová republika;Bangladéš};{República Popular de Bangladesh;Bangladesh};{Narodna Republika Bangladeš;Bangladeš};{Folkrepubliken Bangladesh;Bangladesh};{Bangladeş Halk Cumhuriyeti;Bangladeş};{عوامی جمہوریہ بنگلہ دیش;بنگلہ دیش};{加拉人民共和国;加拉}};[24;90];false;[MMR;IND];147570;;{{Bangladeshi;Bangladeshi};{Bangladaise;Bangladais}}↵
{Bulgaria;Republic of Bulgaria;{bul:{official:Република България;common:България}}};[.bg];BG;100;BGR;BUL;true;officially-assigned;true;Eastern European Group;{BGN:{name:Bulgarian lev;symbol:лв}};{+3;[59]};[Sofia];[BG;Republic of Bulgaria;Република България];Europe;Southeast Europe;{bul:Bulgarian};{{جمهورية بلغاريا;بلغاريا};{Republik Bulgaria;Bulgaria};{Bulhars republika;Bulharsko};{Republik Bulgarien;Bulgarien};{Bulgaaria Vabariik;Bulgaaria};{Bulgarian tasavalta;Bulgaria};{République de Bulgarie;Bulgarie};{Republika Bugarska;Bugarska};{Bolgárztársaság;Bulgária};{Repubblica di Bulgaria;Bulgaria};{ブルリア共和国;ブルリア};{리아;리아};{Republiek Bulgarije;Bulgarije};{جمهوری بلغارستان;بلغارستان};{Republika Bułgarii;Bułgaria};{República da Bulgária;Bulgária};{Республика Болгария;Болгария};{Bulhars republika;Bulharsko};{República de Bulgaria;Bulgaria};{Republika Bugarska;Bugarska};{Republiken Bulgarien;Bulgarien};{Bulgaristan Cumhuriyeti;Bulgaristan};{جمہوریہ بلغاریہ;بلغاریہ};{利亚共和国;利亚}};[43;25];false;[GRC;MKD;ROU;SRB;TUR];110879;;{{Bulgarian;Bulgarian};{Bulgare;Bulgare}}↵
{Bahrain;Kingdom of Bahrain;{ara:{official:مملكة البحرين;common:البحرين}}};[.bh];BH;048;BHR;BRN;true;officially-assigned;true;Asia and the Pacific Group;{BHD:{name:Bahraini dinar;symbol:.د.ب}};{+9;[73]};[Manama];[BH;Kingdom of Bahrain;Mamlakat al-Barayn];Asia;Western Asia;{ara:Arabic};{{مملكة البحرين;البحرين};{Rouantelezh Bahrein;Bahrein};{Království Bahrajn;Bahrajn};{Königreich Bahrain;Bahrain};{Bahreini Kuningriik;Bahrein};{Bahrainin kuningaskunta;Bahrain};{Royaume de Bahreïn;Bahreïn};{Kraljevina Bahrein;Bahrein};{Bahreini Királyság;Bahrein};{Regno del Bahrain;Bahrein};{ー�ーン王国;ー�ーン};{;};{Koninkrijk Bahrein;Bahrein};{پادشاهی بحرین;بحرین};{Klestwo Bahrajnu;Bahrajn};{Reino do Bahrein;Bahrein};{Королевство Бахрейн;Бахрейн};{Bahrajnské kľovstvo;Bahrajn};{Reino de Bahrein;Bahrein};{Kraljevina Bahrein;Bahrein};{Konungariket Bahrain;Bahrain};{Bahreyn Krallığı;Bahreyn};{مملکتِ بحرین;بحرین};{王国;}};[26;50.55];false;[];765;;{{Bahraini;Bahraini};{Bahreïnienne;Bahreïnien}}
... (truncated)
large_non_uniform_nested_mixed.json — Original: 2402 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
Format | Chars | Tokens | chars_og/tok | enc_chars/tok
JSON (pretty) | 2,402 | 802 | 3.0 | 3.0
JSON (min) | 1,500 | 457 | 5.3 | 3.3
CSV | N/A
TSV | N/A
YAML | 1,573 | 533 | 4.5 | 3.0
TOON | 1,766 | 545 | 4.4 | 3.2
TSON | 1,275 | 489 | 4.9 | 2.6
minemizer | 1,203 | 389 | 6.2 | 3.1
minemizer (compact) | 1,072 | 385 | 6.2 | 2.8
JSON (pretty)
chars: 2,402 tokens: 802 chars_og/tok: 3.0 enc_chars/tok: 3.0
<|begin▁of▁sentence|>[↵
· {↵
··· "id":·1,↵
··· "name": "Alice",↵
··· "work": {↵
····· "title": "Senior Engineer",↵
····· "years":·5,↵
····· "remote": true,↵
····· "team": "Platform"↵
··· },↵
··· "contact": {↵
····· "email": "alice@co.com"↵
··· }↵
· },↵
· {↵
··· "id":·2,↵
··· "profile": {↵
····· "age":·28,↵
····· "city": "NYC",↵
····· "verified": true
··· },↵
··· "status": "active",↵
··· "permissions": {↵
····· "admin": false,↵
····· "editor": true
... (truncated)
JSON (min)
chars: 1,500 tokens: 457 chars_og/tok: 5.3 enc_chars/tok: 3.3
<|begin▁of▁sentence|>[{"id":1,"name":"Alice","work":{"title":"Senior Engineer","years":5,"remote":true,"team":"Platform"},"contact":{"email":"alice@co.com"}},{"id":2,"profile":{"age":28,"city":"NYC","verified":true},"status":"active","permissions":{"admin":false,"editor":true}},{"id":3,"name":"Charlie","contact":{"email":"c@example.com","preferred":"email","phone":"555-0103"},"metadata":{"created":"2019-06-10"}},{"id":4,"user":{"username":"diana","role":"admin","level":5},"metadata":{"created":"2020-09-01","updated":"2024-01-20"},"settings":{"theme":"dark"}},{"id":5,"employee":{"name":"Eve Adams","department":"Sales"},"performance":{"score":85,"reviews":3},"contact":{"email":"eve@co.com","slack":"@eve"}},{"id":6,"name":"Frank","work":{"title":"Product Manager","years":8,"remote":false,"team":"Growth"},"contact":{"email":"frank@co.com","phone":"555-0106"}},{"id":7,"profile":{"age":35,"city":"LA","verified":false},"status":"inactive","permissions":{"admin":true,"editor":false},"metadata":{"created":"2018-03-15"}},{"id":8,"name":"Grace","contact":{"email":"grace@example.org","preferred":"slack","slack":"@grace"},"settings":{"theme":"light","notifications":true}},{"id":9,"user":{"username":"henry","role":"viewer","level":2},"employee":{"name":"Henry Wilson","department":"Marketing"},"performance":{"score":72,"reviews":5}},{"id":10,"name":"Iris","work":{"title":"Designer","years":3,"remote":true,"team":"Creative"},"profile":{"age":26,"city":"Austin","verified":true},"contact":{"email":"iris@co.com"}}]
CSV: N/A
TSV: N/A
YAML
chars: 1,573 tokens: 533 chars_og/tok: 4.5 enc_chars/tok: 3.0
<|begin▁of▁sentence|>- contact:↵
··· email: alice@co.com
· id:·1
· name: Alice
· work:↵
··· remote: true
··· team: Platform
··· title: Senior Engineer
··· years:·5
- id:·2
· permissions:↵
··· admin: false
··· editor: true
· profile:↵
··· age:·28
··· city: NYC
··· verified: true
· status: active
- contact:↵
··· email: c@example.com
··· phone:·555-0103
··· preferred: email
· id:·3
· metadata:↵
··· created: '2019-06-10'
... (truncated)
TOON
chars: 1,766 tokens: 545 chars_og/tok: 4.4 enc_chars/tok: 3.2
<|begin▁of▁sentence|>[10]:↵
· - id:·1
··· name: Alice
··· work:↵
····· title: Senior Engineer
····· years:·5
····· remote: true
····· team: Platform
··· contact:↵
····· email: alice@co.com
· - id:·2
··· profile:↵
····· age:·28
····· city: NYC
····· verified: true
··· status: active
··· permissions:↵
····· admin: false
····· editor: true
· - id:·3
··· name: Charlie
··· contact:↵
····· email: c@example.com
····· preferred: email
····· phone:·555-0103
... (truncated)
TSON
chars: 1,275 tokens: 489 chars_og/tok: 4.9 enc_chars/tok: 2.6
<|begin▁of▁sentence|>[{@id,name,work,contact|1,Alice,{@title,years,remote,team|"Senior Engineer",5,true,Platform},{@email|"alice@co.com"}},{@id,profile,status,permissions|2,{@age,city,verified|28,NYC,true},active,{@admin,editor|false,true}},{@id,name,contact,metadata|3,Charlie,{@email,preferred,phone|"c@example.com",email,555-0103},{@created|2019-06-10}},{@id,user,metadata,settings|4,{@username,role,level|diana,admin,5},{@created,updated|2020-09-01,2024-01-20},{@theme|dark}},{@id,employee,performance,contact|5,{@name,department|"Eve Adams",Sales},{@score,reviews|85,3},{@email,slack|"eve@co.com","@eve"}},{@id,name,work,contact|6,Frank,{@title,years,remote,team|"Product Manager",8,false,Growth},{@email,phone|"frank@co.com",555-0106}},{@id,profile,status,permissions,metadata|7,{@age,city,verified|35,LA,false},inactive,{@admin,editor|true,false},{@created|2018-03-15}},{@id,name,contact,settings|8,Grace,{@email,preferred,slack|"grace@example.org",slack,"@grace"},{@theme,notifications|light,true}},{@id,user,employee,performance|9,{@username,role,level|henry,viewer,2},{@name,department|"Henry Wilson",Marketing},{@score,reviews|72,5}},{@id,name,work,profile,contact|10,Iris,{@title,years,remote,team|Designer,3,true,Creative},{@age,city,verified|26,Austin,true},{@email|"iris@co.com"}}]
minemizer
chars: 1,203 tokens: 389 chars_og/tok: 6.2 enc_chars/tok: 3.1
<|begin▁of▁sentence|>id; name; contact{ email; ...}↵
1; Alice;{ alice@co.com}; work{ title: Senior Engineer; years:·5; remote:true; team: Platform}↵
2;;; profile{ age:·28; city: NYC; verified:true}; status: active; permissions{ admin:false; editor:true}↵
3; Charlie;{ c@example.com; preferred: email; phone:·555-0103}; metadata{ created:·2019-06-10}↵
4;;; user{ username: diana; role: admin; level:·5}; metadata{ created:·2020-09-01; updated:·2024-01-20}; settings{ theme: dark}↵
5;;{ eve@co.com; slack: @eve}; employee{ name: Eve Adams; department: Sales}; performance{ score:·85; reviews:·3}↵
6; Frank;{ frank@co.com; phone:·555-0106}; work{ title: Product Manager; years:·8; remote:false; team: Growth}↵
7;;; profile{ age:·35; city: LA; verified:false}; status: inactive; permissions{ admin:true; editor:false}; metadata{ created:·2018-03-15}↵
8; Grace;{ grace@example.org; preferred: slack; slack: @grace}; settings{ theme: light; notifications:true}↵
9;;; user{ username: henry; role: viewer; level:·2}; employee{ name: Henry Wilson; department: Marketing}; performance{ score:·72; reviews:·5}↵
10; Iris;{ iris@co.com}; work{ title: Designer; years:·3; remote:true; team: Creative}; profile{ age:·26; city: Austin; verified:true}
minemizer (compact)
chars: 1,072 tokens: 385 chars_og/tok: 6.2 enc_chars/tok: 2.8
<|begin▁of▁sentence|>id;name;contact{email;...}↵
1;Alice;{alice@co.com};work{title:Senior Engineer;years:5;remote:true;team:Platform}↵
2;;;profile{age:28;city:NYC;verified:true};status:active;permissions{admin:false;editor:true}↵
3;Charlie;{c@example.com;preferred:email;phone:555-0103};metadata{created:2019-06-10}↵
4;;;user{username:diana;role:admin;level:5};metadata{created:2020-09-01;updated:2024-01-20};settings{theme:dark}↵
5;;{eve@co.com;slack:@eve};employee{name:Eve Adams;department:Sales};performance{score:85;reviews:3}↵
6;Frank;{frank@co.com;phone:555-0106};work{title:Product Manager;years:8;remote:false;team:Growth}↵
7;;;profile{age:35;city:LA;verified:false};status:inactive;permissions{admin:true;editor:false};metadata{created:2018-03-15}↵
8;Grace;{grace@example.org;preferred:slack;slack:@grace};settings{theme:light;notifications:true}↵
9;;;user{username:henry;role:viewer;level:2};employee{name:Henry Wilson;department:Marketing};performance{score:72;reviews:5}↵
10;Iris;{iris@co.com};work{title:Designer;years:3;remote:true;team:Creative};profile{age:26;city:Austin;verified:true}
large_non_uniform_nested_numerical.json — Original: 2947 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
Format | Chars | Tokens | chars_og/tok | enc_chars/tok
JSON (pretty) | 2,947 | 1,170 | 2.5 | 2.5
JSON (min) | 1,873 | 749 | 3.9 | 2.5
CSV | N/A
TSV | N/A
YAML | 2,085 | 894 | 3.3 | 2.3
TOON | 2,318 | 906 | 3.3 | 2.6
TSON | 1,642 | 747 | 3.9 | 2.2
minemizer | 1,534 | 699 | 4.2 | 2.2
minemizer (compact) | 1,361 | 642 | 4.6 | 2.1
JSON (pretty)
chars: 2,947 tokens: 1,170 chars_og/tok: 2.5 enc_chars/tok: 2.5
<|begin▁of▁sentence|>[↵
· {↵
··· "id":·1,↵
··· "metrics": {↵
····· "views":·15420,↵
····· "clicks":·842,↵
····· "ctr":·0.0546,↵
····· "bounce_rate":·0.32
··· },↵
··· "revenue": {↵
····· "amount":·12499.99,↵
····· "currency_rate":·1.0
··· },↵
··· "timestamp": "2024-01-15T09:30:00Z"↵
· },↵
· {↵
··· "id":·2,↵
··· "metrics": {↵
····· "views":·8923,↵
····· "clicks":·156,↵
····· "ctr":·0.0175,↵
····· "bounce_rate":·0.67
··· },↵
··· "stats": {↵
····· "avg_time":·45.7,
... (truncated)
JSON (min)
chars: 1,873 tokens: 749 chars_og/tok: 3.9 enc_chars/tok: 2.5
<|begin▁of▁sentence|>[{"id":1,"metrics":{"views":15420,"clicks":842,"ctr":0.0546,"bounce_rate":0.32},"revenue":{"amount":12499.99,"currency_rate":1.0},"timestamp":"2024-01-15T09:30:00Z"},{"id":2,"metrics":{"views":8923,"clicks":156,"ctr":0.0175,"bounce_rate":0.67},"stats":{"avg_time":45.7,"pages_per_session":2.3,"return_rate":0.15},"timestamp":"2024-01-16T14:22:33Z"},{"id":3,"revenue":{"amount":8750.5,"tax":700.04,"net":8050.46,"currency_rate":0.92},"inventory":{"count":342,"reserved":28,"available":314}},{"id":4,"metrics":{"views":52100,"clicks":3891,"ctr":0.0747,"bounce_rate":0.21},"performance":{"latency_ms":127.5,"uptime":0.9987,"errors":3},"timestamp":"2024-01-17T08:00:00Z"},{"id":5,"stats":{"avg_time":128.9,"pages_per_session":5.7,"return_rate":0.42},"scores":{"quality":94,"relevance":87,"engagement":0.78},"dates":{"start":"2023-06-01","end":"2024-01-31"}},{"id":6,"inventory":{"count":1205,"reserved":89,"available":1116,"reorder_point":200},"pricing":{"cost":24.99,"markup":0.35,"price":33.74},"timestamp":"2024-01-18T11:45:12Z"},{"id":7,"metrics":{"views":3156,"clicks":98,"ctr":0.031,"bounce_rate":0.55},"revenue":{"amount":2150.0,"tax":172.0,"net":1978.0},"performance":{"latency_ms":89.2,"uptime":0.9995,"errors":0}},{"id":8,"scores":{"quality":78,"relevance":92,"engagement":0.65,"nps":45},"dates":{"start":"2022-11-15","end":"2024-02-28","renewal":"2024-03-01"},"budget":{"allocated":50000,"spent":42350.75,"remaining":7649.25}},{"id":9,"pricing":{"cost":149.99,"markup":0.28,"price":191.99,"discount":0.1},"inventory":{"count":56,"reserved":12,"available":44},"timestamp":"2024-01-19T16:30:45Z"},{"id":10,"metrics":{"views":128750,"clicks":9823,"ctr":0.0763,"bounce_rate":0.18},"stats":{"avg_time":312.4,"pages_per_session":8.2,"return_rate":0.58},"budget":{"allocated":125000,"spent":98420.33,"remaining":26579.67},"dates":{"start":"2023-01-01","end":"2024-12-31"}}]
CSV: N/A
TSV: N/A
YAML
chars: 2,085 tokens: 894 chars_og/tok: 3.3 enc_chars/tok: 2.3
<|begin▁of▁sentence|>- id:·1
· metrics:↵
··· bounce_rate:·0.32
··· clicks:·842
··· ctr:·0.0546
··· views:·15420
· revenue:↵
··· amount:·12499.99
··· currency_rate:·1.0
· timestamp: '2024-01-15T09:30:00Z'↵
- id:·2
· metrics:↵
··· bounce_rate:·0.67
··· clicks:·156
··· ctr:·0.0175
··· views:·8923
· stats:↵
··· avg_time:·45.7
··· pages_per_session:·2.3
··· return_rate:·0.15
· timestamp: '2024-01-16T14:22:33Z'↵
- id:·3
· inventory:↵
··· available:·314
··· count:·342
... (truncated)
TOON
chars: 2,318 tokens: 906 chars_og/tok: 3.3 enc_chars/tok: 2.6
<|begin▁of▁sentence|>[10]:↵
· - id:·1
··· metrics:↵
····· views:·15420
····· clicks:·842
····· ctr:·0.0546
····· bounce_rate:·0.32
··· revenue:↵
····· amount:·12499.99
····· currency_rate:·1.0
··· timestamp: "2024-01-15T09:30:00Z"↵
· - id:·2
··· metrics:↵
····· views:·8923
····· clicks:·156
····· ctr:·0.0175
····· bounce_rate:·0.67
··· stats:↵
····· avg_time:·45.7
····· pages_per_session:·2.3
····· return_rate:·0.15
··· timestamp: "2024-01-16T14:22:33Z"↵
· - id:·3
··· revenue:↵
····· amount:·8750.5
... (truncated)
TSON
chars: 1,642 tokens: 747 chars_og/tok: 3.9 enc_chars/tok: 2.2
<|begin▁of▁sentence|>[{@id,metrics,revenue,timestamp|1,{@views,clicks,ctr,bounce_rate|15420,842,0.0546,0.32},{@amount,currency_rate|12499.99,1.0},2024-01-15T09:30:00Z},{@id,metrics,stats,timestamp|2,{@views,clicks,ctr,bounce_rate|8923,156,0.0175,0.67},{@avg_time,pages_per_session,return_rate|45.7,2.3,0.15},2024-01-16T14:22:33Z},{@id,revenue,inventory|3,{@amount,tax,net,currency_rate|8750.5,700.04,8050.46,0.92},{@count,reserved,available|342,28,314}},{@id,metrics,performance,timestamp|4,{@views,clicks,ctr,bounce_rate|52100,3891,0.0747,0.21},{@latency_ms,uptime,errors|127.5,0.9987,3},2024-01-17T08:00:00Z},{@id,stats,scores,dates|5,{@avg_time,pages_per_session,return_rate|128.9,5.7,0.42},{@quality,relevance,engagement|94,87,0.78},{@start,end|2023-06-01,2024-01-31}},{@id,inventory,pricing,timestamp|6,{@count,reserved,available,reorder_point|1205,89,1116,200},{@cost,markup,price|24.99,0.35,33.74},2024-01-18T11:45:12Z},{@id,metrics,revenue,performance|7,{@views,clicks,ctr,bounce_rate|3156,98,0.031,0.55},{@amount,tax,net|2150.0,172.0,1978.0},{@latency_ms,uptime,errors|89.2,0.9995,0}},{@id,scores,dates,budget|8,{@quality,relevance,engagement,nps|78,92,0.65,45},{@start,end,renewal|2022-11-15,2024-02-28,2024-03-01},{@allocated,spent,remaining|50000,42350.75,7649.25}},{@id,pricing,inventory,timestamp|9,{@cost,markup,price,discount|149.99,0.28,191.99,0.1},{@count,reserved,available|56,12,44},2024-01-19T16:30:45Z},{@id,metrics,stats,budget,dates|10,{@views,clicks,ctr,bounce_rate|128750,9823,0.0763,0.18},{@avg_time,pages_per_session,return_rate|312.4,8.2,0.58},{@allocated,spent,remaining|125000,98420.33,26579.67},{@start,end|2023-01-01,2024-12-31}}]
minemizer
chars: 1,534 tokens: 699 chars_og/tok: 4.2 enc_chars/tok: 2.2
<|begin▁of▁sentence|>id; metrics{ views; clicks; ctr; bounce_rate}; timestamp
1;{·15420;·842;·0.0546;·0.32};·2024-01-15T09:30:00Z; revenue{ amount:·12499.99; currency_rate:·1.0}↵
2;{·8923;·156;·0.0175;·0.67};·2024-01-16T14:22:33Z; stats{ avg_time:·45.7; pages_per_session:·2.3; return_rate:·0.15}↵
3;;; revenue{ amount:·8750.5; tax:·700.04; net:·8050.46; currency_rate:·0.92}; inventory{ count:·342; reserved:·28; available:·314}↵
4;{·52100;·3891;·0.0747;·0.21};·2024-01-17T08:00:00Z; performance{ latency_ms:·127.5; uptime:·0.9987; errors:·3}↵
5;;; stats{ avg_time:·128.9; pages_per_session:·5.7; return_rate:·0.42}; scores{ quality:·94; relevance:·87; engagement:·0.78}; dates{ start:·2023-06-01; end:·2024-01-31}↵
6;;·2024-01-18T11:45:12Z; inventory{ count:·1205; reserved:·89; available:·1116; reorder_point:·200}; pricing{ cost:·24.99; markup:·0.35; price:·33.74}↵
7;{·3156;·98;·0.031;·0.55};; revenue{ amount:·2150.0; tax:·172.0; net:·1978.0}; performance{ latency_ms:·89.2; uptime:·0.9995; errors:·0}↵
8;;; scores{ quality:·78; relevance:·92; engagement:·0.65; nps:·45}; dates{ start:·2022-11-15; end:·2024-02-28; renewal:·2024-03-01}; budget{ allocated:·50000; spent:·42350.75; remaining:·7649.25}↵
9;;·2024-01-19T16:30:45Z; pricing{ cost:·149.99; markup:·0.28; price:·191.99; discount:·0.1}; inventory{ count:·56; reserved:·12; available:·44}↵
10;{·128750;·9823;·0.0763;·0.18};; stats{ avg_time:·312.4; pages_per_session:·8.2; return_rate:·0.58}; budget{ allocated:·125000; spent:·98420.33; remaining:·26579.67}; dates{ start:·2023-01-01; end:·2024-12-31}
minemizer (compact)
chars: 1,361 tokens: 642 chars_og/tok: 4.6 enc_chars/tok: 2.1
<|begin▁of▁sentence|>id;metrics{views;clicks;ctr;bounce_rate};timestamp
1;{15420;842;0.0546;0.32};2024-01-15T09:30:00Z;revenue{amount:12499.99;currency_rate:1.0}↵
2;{8923;156;0.0175;0.67};2024-01-16T14:22:33Z;stats{avg_time:45.7;pages_per_session:2.3;return_rate:0.15}↵
3;;;revenue{amount:8750.5;tax:700.04;net:8050.46;currency_rate:0.92};inventory{count:342;reserved:28;available:314}↵
4;{52100;3891;0.0747;0.21};2024-01-17T08:00:00Z;performance{latency_ms:127.5;uptime:0.9987;errors:3}↵
5;;;stats{avg_time:128.9;pages_per_session:5.7;return_rate:0.42};scores{quality:94;relevance:87;engagement:0.78};dates{start:2023-06-01;end:2024-01-31}↵
6;;2024-01-18T11:45:12Z;inventory{count:1205;reserved:89;available:1116;reorder_point:200};pricing{cost:24.99;markup:0.35;price:33.74}↵
7;{3156;98;0.031;0.55};;revenue{amount:2150.0;tax:172.0;net:1978.0};performance{latency_ms:89.2;uptime:0.9995;errors:0}↵
8;;;scores{quality:78;relevance:92;engagement:0.65;nps:45};dates{start:2022-11-15;end:2024-02-28;renewal:2024-03-01};budget{allocated:50000;spent:42350.75;remaining:7649.25}↵
9;;2024-01-19T16:30:45Z;pricing{cost:149.99;markup:0.28;price:191.99;discount:0.1};inventory{count:56;reserved:12;available:44}↵
10;{128750;9823;0.0763;0.18};;stats{avg_time:312.4;pages_per_session:8.2;return_rate:0.58};budget{allocated:125000;spent:98420.33;remaining:26579.67};dates{start:2023-01-01;end:2024-12-31}
large_non_uniform_nested_text.json — Original: 4214 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)4,2149864.34.3
JSON (min)3,3596476.55.2
CSVN/A
TSVN/A
YAML3,3877036.04.8
TOON3,5347056.05.0
TSON3,1736896.14.6
minemizer2,8095008.45.6
minemizer (compact)2,6945278.05.1
JSON (pretty)
chars: 4,214 tokens: 986 chars_og/tok: 4.3 enc_chars/tok: 4.3
<|begin▁of▁sentence|>[↵
· {↵
··· "id":·1,↵
··· "title": "Introduction to Machine Learning",↵
··· "author": {↵
····· "name": "Dr. Sarah Chen",↵
····· "affiliation": "Stanford University",↵
····· "department": "Computer Science"↵
··· },↵
··· "abstract": "A comprehensive overview of modern machine learning techniques and applications",↵
··· "tags": [↵
····· "AI",↵
····· "ML",↵
····· "deep learning"↵
··· ]↵
· },↵
· {↵
··· "id":·2,↵
··· "title": "Climate Change Impact Assessment",↵
··· "content": {↵
····· "summary": "Analysis of rising sea levels and temperature patterns",↵
····· "methodology": "longitudinal study with satellite imagery",↵
····· "conclusion": "significant acceleration observed since·2010"↵
··· },↵
··· "category": "Environmental Science"
... (truncated)
JSON (min)
chars: 3,359 tokens: 647 chars_og/tok: 6.5 enc_chars/tok: 5.2
<|begin▁of▁sentence|>[{"id":1,"title":"Introduction to Machine Learning","author":{"name":"Dr. Sarah Chen","affiliation":"Stanford University","department":"Computer Science"},"abstract":"A comprehensive overview of modern machine learning techniques and applications","tags":["AI","ML","deep learning"]},{"id":2,"title":"Climate Change Impact Assessment","content":{"summary":"Analysis of rising sea levels and temperature patterns","methodology":"longitudinal study with satellite imagery","conclusion":"significant acceleration observed since·2010"},"category":"Environmental Science"},{"id":3,"author":{"name":"Marcus Williams","affiliation":"MIT Media Lab","role":"Principal Researcher"},"publication":{"journal":"Nature Communications","volume":"fifteen","status":"peer-reviewed"},"keywords":"quantum computing, error correction, fault tolerance"},{"id":4,"title":"Urban Planning Strategies for Sustainable Cities","abstract":"Examining green infrastructure and mixed-use development patterns","content":{"summary":"Case studies from Copenhagen, Singapore, and Portland","methodology":"comparative analysis with community surveys","findings":"walkability correlates strongly with resident satisfaction"},"tags":["urban design","sustainability","planning"]},{"id":5,"publication":{"journal":"The Lancet","volume":"four hundred two","issue":"special edition","status":"published"},"content":{"summary":"Global health outcomes following pandemic response measures","conclusion":"early intervention strategies proved most effective"},"category":"Public Health"},{"id":6,"title":"Advances in Natural Language Processing","author":{"name":"Dr. 
James Rodriguez","affiliation":"Google Research","department":"Language Understanding"},"abstract":"Survey of transformer architectures and attention mechanisms in modern NLP systems","keywords":"transformers, attention, language models, BERT, GPT"},{"id":7,"content":{"summary":"Historical analysis of economic policy shifts in emerging markets","methodology":"archival research combined with econometric modeling","findings":"trade liberalization showed mixed results across regions","limitations":"data availability constraints for pre-1990 period"},"category":"Economics","tags":["policy","trade","development"]},{"id":8,"title":"Biodiversity Conservation in Tropical Rainforests","author":{"name":"Dr. Ana Costa","affiliation":"Brazilian Institute for Amazonian Research","role":"Lead Ecologist"},"publication":{"journal":"Conservation Biology","status":"under review"},"abstract":"Mapping species distribution patterns and identifying critical habitat corridors"},{"id":9,"title":"Behavioral Economics and Consumer Decision Making","content":{"summary":"Experimental studies on cognitive biases in purchasing behavior","methodology":"randomized controlled trials with eye-tracking technology","conclusion":"anchoring effects persist even with expert consumers"},"keywords":"behavioral economics, decision theory, consumer psychology","category":"Psychology"},{"id":10,"author":{"name":"Prof. Michael Thompson","affiliation":"Oxford University","department":"Engineering Science","role":"Department Chair"},"publication":{"journal":"Advanced Materials","volume":"thirty-six","status":"accepted"},"abstract":"Novel synthesis methods for high-performance ceramic composites","tags":["materials science","ceramics","nanotechnology"]}]
CSV: N/A
TSV: N/A
YAML
chars: 3,387 tokens: 703 chars_og/tok: 6.0 enc_chars/tok: 4.8
<|begin▁of▁sentence|>- abstract: A comprehensive overview of modern machine learning techniques and applications
· author:↵
··· affiliation: Stanford University
··· department: Computer Science
··· name: Dr. Sarah Chen
· id:·1
· tags:↵
· - AI
· - ML
· - deep learning
· title: Introduction to Machine Learning
- category: Environmental Science
· content:↵
··· conclusion: significant acceleration observed since·2010
··· methodology: longitudinal study with satellite imagery
··· summary: Analysis of rising sea levels and temperature patterns
· id:·2
· title: Climate Change Impact Assessment
- author:↵
··· affiliation: MIT Media Lab
··· name: Marcus Williams
··· role: Principal Researcher
· id:·3
· keywords: quantum computing, error correction, fault tolerance
· publication:
... (truncated)
TOON
chars: 3,534 tokens: 705 chars_og/tok: 6.0 enc_chars/tok: 5.0
<|begin▁of▁sentence|>[10]:↵
· - id:·1
··· title: Introduction to Machine Learning
··· author:↵
····· name: Dr. Sarah Chen
····· affiliation: Stanford University
····· department: Computer Science
··· abstract: A comprehensive overview of modern machine learning techniques and applications
··· tags[3]: AI,ML,deep learning
· - id:·2
··· title: Climate Change Impact Assessment
··· content:↵
····· summary: Analysis of rising sea levels and temperature patterns
····· methodology: longitudinal study with satellite imagery
····· conclusion: significant acceleration observed since·2010
··· category: Environmental Science
· - id:·3
··· author:↵
····· name: Marcus Williams
····· affiliation: MIT Media Lab
····· role: Principal Researcher
··· publication:↵
····· journal: Nature Communications
····· volume: fifteen
····· status: peer-reviewed
... (truncated)
TSON
chars: 3,173 tokens: 689 chars_og/tok: 6.1 enc_chars/tok: 4.6
<|begin▁of▁sentence|>[{@id,title,author,abstract,tags|1,"Introduction to Machine Learning",{@name,affiliation,department|"Dr. Sarah Chen","Stanford University","Computer Science"},"A comprehensive overview of modern machine learning techniques and applications",[AI,ML,"deep learning"]},{@id,title,content,category|2,"Climate Change Impact Assessment",{@summary,methodology,conclusion|"Analysis of rising sea levels and temperature patterns","longitudinal study with satellite imagery","significant acceleration observed since·2010"},"Environmental Science"},{@id,author,publication,keywords|3,{@name,affiliation,role|"Marcus Williams","MIT Media Lab","Principal Researcher"},{@journal,volume,status|"Nature Communications",fifteen,peer-reviewed},"quantum computing, error correction, fault tolerance"},{@id,title,abstract,content,tags|4,"Urban Planning Strategies for Sustainable Cities","Examining green infrastructure and mixed-use development patterns",{@summary,methodology,findings|"Case studies from Copenhagen, Singapore, and Portland","comparative analysis with community surveys","walkability correlates strongly with resident satisfaction"},["urban design",sustainability,planning]},{@id,publication,content,category|5,{@journal,volume,issue,status|"The Lancet","four hundred two","special edition",published},{@summary,conclusion|"Global health outcomes following pandemic response measures","early intervention strategies proved most effective"},"Public Health"},{@id,title,author,abstract,keywords|6,"Advances in Natural Language Processing",{@name,affiliation,department|"Dr. 
James Rodriguez","Google Research","Language Understanding"},"Survey of transformer architectures and attention mechanisms in modern NLP systems","transformers, attention, language models, BERT, GPT"},{@id,content,category,tags|7,{@summary,methodology,findings,limitations|"Historical analysis of economic policy shifts in emerging markets","archival research combined with econometric modeling","trade liberalization showed mixed results across regions","data availability constraints for pre-1990 period"},Economics,[policy,trade,development]},{@id,title,author,publication,abstract|8,"Biodiversity Conservation in Tropical Rainforests",{@name,affiliation,role|"Dr. Ana Costa","Brazilian Institute for Amazonian Research","Lead Ecologist"},{@journal,status|"Conservation Biology","under review"},"Mapping species distribution patterns and identifying critical habitat corridors"},{@id,title,content,keywords,category|9,"Behavioral Economics and Consumer Decision Making",{@summary,methodology,conclusion|"Experimental studies on cognitive biases in purchasing behavior","randomized controlled trials with eye-tracking technology","anchoring effects persist even with expert consumers"},"behavioral economics, decision theory, consumer psychology",Psychology},{@id,author,publication,abstract,tags|10,{@name,affiliation,department,role|"Prof. Michael Thompson","Oxford University","Engineering Science","Department Chair"},{@journal,volume,status|"Advanced Materials",thirty-six,accepted},"Novel synthesis methods for high-performance ceramic composites",["materials science",ceramics,nanotechnology]}]
minemizer
chars: 2,809 tokens: 500 chars_og/tok: 8.4 enc_chars/tok: 5.6
<|begin▁of▁sentence|>id; title; author{ name; affiliation; department; role}; abstract; content{ summary; methodology; conclusion; ...}↵
1; Introduction to Machine Learning;{ Dr. Sarah Chen; Stanford University; Computer Science;}; A comprehensive overview of modern machine learning techniques and applications;; tags[ AI; ML; deep learning]↵
2; Climate Change Impact Assessment;;;{ Analysis of rising sea levels and temperature patterns; longitudinal study with satellite imagery; significant acceleration observed since·2010}; category: Environmental Science
3;;{ Marcus Williams; MIT Media Lab;; Principal Researcher};;; publication{ journal: Nature Communications; volume: fifteen; status: peer-reviewed}; keywords: quantum computing, error correction, fault tolerance
4; Urban Planning Strategies for Sustainable Cities;; Examining green infrastructure and mixed-use development patterns;{ Case studies from Copenhagen, Singapore, and Portland; comparative analysis with community surveys;; findings: walkability correlates strongly with resident satisfaction}; tags[ urban design; sustainability; planning]↵
5;;;;{ Global health outcomes following pandemic response measures;; early intervention strategies proved most effective}; publication{ journal: The Lancet; volume: four hundred two; issue: special edition; status: published}; category: Public Health
6; Advances in Natural Language Processing;{ Dr. James Rodriguez; Google Research; Language Understanding;}; Survey of transformer architectures and attention mechanisms in modern NLP systems;; keywords: transformers, attention, language models, BERT, GPT
7;;;;{ Historical analysis of economic policy shifts in emerging markets; archival research combined with econometric modeling;; findings: trade liberalization showed mixed results across regions; limitations: data availability constraints for pre-1990 period}; category: Economics; tags[ policy; trade; development]↵
8; Biodiversity Conservation in Tropical Rainforests;{ Dr. Ana Costa; Brazilian Institute for Amazonian Research;; Lead Ecologist}; Mapping species distribution patterns and identifying critical habitat corridors;; publication{ journal: Conservation Biology; status: under review}↵
9; Behavioral Economics and Consumer Decision Making;;;{ Experimental studies on cognitive biases in purchasing behavior; randomized controlled trials with eye-tracking technology; anchoring effects persist even with expert consumers}; keywords: behavioral economics, decision theory, consumer psychology; category: Psychology
10;;{ Prof. Michael Thompson; Oxford University; Engineering Science; Department Chair}; Novel synthesis methods for high-performance ceramic composites;; publication{ journal: Advanced Materials; volume: thirty-six; status: accepted}; tags[ materials science; ceramics; nanotechnology]
minemizer (compact)
chars: 2,694 tokens: 527 chars_og/tok: 8.0 enc_chars/tok: 5.1
<|begin▁of▁sentence|>id;title;author{name;affiliation;department;role};abstract;content{summary;methodology;conclusion;...}↵
1;Introduction to Machine Learning;{Dr. Sarah Chen;Stanford University;Computer Science;};A comprehensive overview of modern machine learning techniques and applications;;tags[AI;ML;deep learning]↵
2;Climate Change Impact Assessment;;;{Analysis of rising sea levels and temperature patterns;longitudinal study with satellite imagery;significant acceleration observed since·2010};category:Environmental Science
3;;{Marcus Williams;MIT Media Lab;;Principal Researcher};;;publication{journal:Nature Communications;volume:fifteen;status:peer-reviewed};keywords:quantum computing, error correction, fault tolerance
4;Urban Planning Strategies for Sustainable Cities;;Examining green infrastructure and mixed-use development patterns;{Case studies from Copenhagen, Singapore, and Portland;comparative analysis with community surveys;;findings:walkability correlates strongly with resident satisfaction};tags[urban design;sustainability;planning]↵
5;;;;{Global health outcomes following pandemic response measures;;early intervention strategies proved most effective};publication{journal:The Lancet;volume:four hundred two;issue:special edition;status:published};category:Public Health
6;Advances in Natural Language Processing;{Dr. James Rodriguez;Google Research;Language Understanding;};Survey of transformer architectures and attention mechanisms in modern NLP systems;;keywords:transformers, attention, language models, BERT, GPT
7;;;;{Historical analysis of economic policy shifts in emerging markets;archival research combined with econometric modeling;;findings:trade liberalization showed mixed results across regions;limitations:data availability constraints for pre-1990 period};category:Economics;tags[policy;trade;development]↵
8;Biodiversity Conservation in Tropical Rainforests;{Dr. Ana Costa;Brazilian Institute for Amazonian Research;;Lead Ecologist};Mapping species distribution patterns and identifying critical habitat corridors;;publication{journal:Conservation Biology;status:under review}↵
9;Behavioral Economics and Consumer Decision Making;;;{Experimental studies on cognitive biases in purchasing behavior;randomized controlled trials with eye-tracking technology;anchoring effects persist even with expert consumers};keywords:behavioral economics, decision theory, consumer psychology;category:Psychology
10;;{Prof. Michael Thompson;Oxford University;Engineering Science;Department Chair};Novel synthesis methods for high-performance ceramic composites;;publication{journal:Advanced Materials;volume:thirty-six;status:accepted};tags[materials science;ceramics;nanotechnology]
mcp_tools_list.json — Original: 51663 chars — Tokenizer: deepseek (deepseek-ai/DeepSeek-V3)
FormatCharsTokenschars_og/tokenc_chars/tok
JSON (pretty)51,66311,3034.64.6
JSON (min)30,7246,9777.44.4
CSVN/A
TSVN/A
YAML38,1397,9976.54.8
TOON38,3767,7676.74.9
TSON25,8786,7317.73.8
minemizer23,3835,3429.74.4
minemizer (compact)21,9125,2169.94.2
JSON (pretty)
chars: 51,663 tokens: 11,303 chars_og/tok: 4.6 enc_chars/tok: 4.6
<|begin▁of▁sentence|>[↵
· {↵
··· "inputSchema": {↵
····· "json": {↵
······· "properties": {↵
········· "body": {↵
··········· "description": "Comment content",↵
··········· "type": "string"↵
········· },↵
········· "issue_number": {↵
··········· "description": "Issue number to comment on",↵
··········· "type": "number"↵
········· },↵
········· "owner": {↵
··········· "description": "Repository owner",↵
··········· "type": "string"↵
········· },↵
········· "repo": {↵
··········· "description": "Repository name",↵
··········· "type": "string"↵
········· }↵
······· },↵
······· "required": [↵
········· "owner",↵
········· "repo",
... (truncated)
JSON (min)
chars: 30,724 tokens: 6,977 chars_og/tok: 7.4 enc_chars/tok: 4.4
<|begin▁of▁sentence|>[{"inputSchema":{"json":{"properties":{"body":{"description":"Comment content","type":"string"},"issue_number":{"description":"Issue number to comment on","type":"number"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","issue_number","body"],"type":"object"}},"name":"add_issue_comment","description":"Add a comment to a specific issue in a GitHub repository."},{"inputSchema":{"json":{"properties":{"body":{"description":"The text of the review comment","type":"string"},"line":{"description":"The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range","type":"number"},"owner":{"description":"Repository owner","type":"string"},"path":{"description":"The relative path to the file that necessitates a comment","type":"string"},"pullNumber":{"description":"Pull request number","type":"number"},"repo":{"description":"Repository name","type":"string"},"side":{"description":"The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state","enum":["LEFT","RIGHT"],"type":"string"},"startLine":{"description":"For multi-line comments, the first line of the range that the comment applies to","type":"number"},"startSide":{"description":"For multi-line comments, the starting side of the diff that the comment applies to. 
LEFT indicates the previous state, RIGHT indicates the new state","enum":["LEFT","RIGHT"],"type":"string"},"subjectType":{"description":"The level at which the comment is targeted","enum":["FILE","LINE"],"type":"string"}},"required":["owner","repo","pullNumber","path","body","subjectType"],"type":"object"}},"name":"add_pull_request_review_comment_to_pending_review","description":"Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure)."},{"inputSchema":{"json":{"properties":{"issueNumber":{"description":"Issue number","type":"number"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","issueNumber"],"type":"object"}},"name":"assign_copilot_to_issue","description":"Assign Copilot to a specific issue in a GitHub repository.\n\nThis tool can help with the following outcomes:\n- a Pull Request created with source code changes to resolve the issue\n\n\nMore information can be found at:\n- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot\n"},{"inputSchema":{"json":{"properties":{"body":{"description":"Review comment text","type":"string"},"commitID":{"description":"SHA of commit to review","type":"string"},"event":{"description":"Review action to perform","enum":["APPROVE","REQUEST_CHANGES","COMMENT"],"type":"string"},"owner":{"description":"Repository owner","type":"string"},"pullNumber":{"description":"Pull request number","type":"number"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","pullNumber","body","event"],"type":"object"}},"name":"create_and_submit_pull_request_review","description":"Create and submit a review for a pull request without review comments."},{"inputSchema":{"json":{"properties":{"branch":{"description":"Name for new 
branch","type":"string"},"from_branch":{"description":"Source branch (defaults to repo default)","type":"string"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"}},"required":["owner","repo","branch"],"type":"object"}},"name":"create_branch","description":"Create a new branch in a GitHub repository"},{"inputSchema":{"json":{"properties":{"assignees":{"description":"Usernames to assign to this issue","items":{"type":"string"},"type":"array"},"body":{"description":"Issue body content","type":"string"},"labels":{"description":"Labels to apply to this issue","items":{"type":"string"},"type":"array"},"milestone":{"description":"Milestone number","type":"number"},"owner":{"description":"Repository owner","type":"string"},"repo":{"description":"Repository name","type":"string"},"title":{"description":"Issue title","type":"string"}},"required":["owner","repo","title"],"type":"object"}},"name":"create_issue","description":"Create a new issue in a GitHub repository."},{"inputSchema":{"json":{"properties":{"branch":{"description":"Branch to create/update the file in","type":"string"},"content":{"description":"Content of the file","type":"string"},"message":{"description":"Commit message","type":"string"},"owner":{"description":"Repository owner (username or organization)","type":"string"},"path":{"description":"Path where to create/update the file","type":"string"},"repo":{"description":"Repository name","type":"string"},"sha":{"description":"SHA of file being replaced (for updates)","type":"string"}},"required":["ow
... (truncated)
CSV: N/A
TSV: N/A
YAML
chars: 38,139 tokens: 7,997 chars_og/tok: 6.5 enc_chars/tok: 4.8
<|begin▁of▁sentence|>- description: Add a comment to a specific issue in a GitHub repository.↵
· inputSchema:↵
··· json:↵
····· properties:↵
······· body:↵
········· description: Comment content
········· type: string
······· issue_number:↵
········· description: Issue number to comment on
········· type: number
······· owner:↵
········· description: Repository owner
········· type: string
······· repo:↵
········· description: Repository name
········· type: string
····· required:↵
····· - owner
····· - repo
····· - issue_number
····· - body
····· type: object
· name: add_issue_comment
- description: Add a comment to the requester's latest pending pull request review,↵
··· a pending review needs to already exist to call this (check with the user if not
... (truncated)
TOON
chars: 38,376 tokens: 7,767 chars_og/tok: 6.7 enc_chars/tok: 4.9
<|begin▁of▁sentence|>[51]:↵
· -↵
··· inputSchema:↵
····· json:↵
······· properties:↵
········· body:↵
··········· description: Comment content
··········· type: string
········· issue_number:↵
··········· description: Issue number to comment on
··········· type: number
········· owner:↵
··········· description: Repository owner
··········· type: string
········· repo:↵
··········· description: Repository name
··········· type: string
······· required[4]: owner,repo,issue_number,body
······· type: object
··· name: add_issue_comment
··· description: Add a comment to a specific issue in a GitHub repository.↵
· -↵
··· inputSchema:↵
····· json:↵
······· properties:
... (truncated)
TSON
chars: 25,878 tokens: 6,731 chars_og/tok: 7.7 enc_chars/tok: 3.8
<|begin▁of▁sentence|>{@inputSchema(@json),name,description#51|{{@properties,required,type|{@body,issue_number,owner,repo|{@description,type|"Comment content",string},{@description,type|"Issue number to comment on",number},{@description,type|"Repository owner",string},{@description,type|"Repository name",string}},[owner,repo,issue_number,body],object}},add_issue_comment,"Add a comment to a specific issue in a GitHub repository."|{{@properties,required,type|{@body,line,owner,path,pullNumber,repo,side,startLine,startSide,subjectType|{@description,type|"The text of the review comment",string},{@description,type|"The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range",number},{@description,type|"Repository owner",string},{@description,type|"The relative path to the file that necessitates a comment",string},{@description,type|"Pull request number",number},{@description,type|"Repository name",string},{@description,enum,type|"The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state",[LEFT,RIGHT],string},{@description,type|"For multi-line comments, the first line of the range that the comment applies to",number},{@description,enum,type|"For multi-line comments, the starting side of the diff that the comment applies to. 
LEFT indicates the previous state, RIGHT indicates the new state",[LEFT,RIGHT],string},{@description,enum,type|"The level at which the comment is targeted",[FILE,LINE],string}},[owner,repo,pullNumber,path,body,subjectType],object}},add_pull_request_review_comment_to_pending_review,"Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure)."|{{@properties,required,type|{@issueNumber,owner,repo|{@description,type|"Issue number",number},{@description,type|"Repository owner",string},{@description,type|"Repository name",string}},[owner,repo,issueNumber],object}},assign_copilot_to_issue,"Assign Copilot to a specific issue in a GitHub repository.\n\nThis tool can help with the following outcomes:\n- a Pull Request created with source code changes to resolve the issue\n\n\nMore information can be found at:\n- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot\n"|{{@properties,required,type|{@body,commitID,event,owner,pullNumber,repo|{@description,type|"Review comment text",string},{@description,type|"SHA of commit to review",string},{@description,enum,type|"Review action to perform",[APPROVE,REQUEST_CHANGES,COMMENT],string},{@description,type|"Repository owner",string},{@description,type|"Pull request number",number},{@description,type|"Repository name",string}},[owner,repo,pullNumber,body,event],object}},create_and_submit_pull_request_review,"Create and submit a review for a pull request without review comments."|{{@properties,required,type|{@branch,from_branch,owner,repo|{@description,type|"Name for new branch",string},{@description,type|"Source branch (defaults to repo default)",string},{@description,type|"Repository owner",string},{@description,type|"Repository name",string}},[owner,repo,branch],object}},create_branch,"Create a new branch in a GitHub 
repository"|{{@properties,required,type|{@assignees,body,labels,milestone,owner,repo,title|{@description,items,type|"Usernames to assign to this issue",{@type|string},array},{@description,type|"Issue body content",string},{@description,items,type|"Labels to apply to this issue",{@type|string},array},{@description,type|"Milestone number",number},{@description,type|"Repository owner",string},{@description,type|"Repository name",string},{@description,type|"Issue title",string}},[owner,repo,title],object}},create_issue,"Create a new issue in a GitHub repository."|{{@properties,required,type|{@branch,content,message,owner,path,repo,sha|{@description,type|"Branch to create/update the file in",string},{@description,type|"Content of the file",string},{@description,type|"Commit message",string},{@description,type|"Repository owner (username or organization)",string},{@description,type|"Path where to create/update the file",string},{@description,type|"Repository name",string},{@description,type|"SHA of file being replaced (for updates)",string}},[owner,repo,path,content,message,branch],object}},create_or_update_file,"Create or update a single file in a GitHub repository. If updating, you must provide the SHA of the file you want to update."|{{@properties,required,type|{@commitID,owner,pullNumber,repo|{@description,type|"SHA of commit to review",string},{@description,type|"Repository owner",string},{@description,type|"Pull request number",number},{@description,type|"Repository name",string}},[owner,repo,pullNumber],object}},create_pending_pull_request_review,"Create a pending review for a pull request. Call this first before attempting to add comments to a pending review, and ultimately submitting it
... (truncated)
minemizer
chars: 23,383 tokens: 5,342 chars_og/tok: 9.7 enc_chars/tok: 4.4
<|begin▁of▁sentence|>inputSchema{ json{ properties{ owner{ description; type}; repo{ description; type}; ...}; required[]; type}}; name; description
{{ {{ Repository owner; string};{ Repository name; string}; body:{ description: Comment content; type: string}; issue_number:{ description: Issue number to comment on; type: number}};[ owner; repo; issue_number; body]; object}}; add_issue_comment; Add a comment to a specific issue in a GitHub repository.↵
{{ {{ Repository owner; string};{ Repository name; string}; body:{ description: The text of the review comment; type: string}; line:{ description: The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range; type: number}; path:{ description: The relative path to the file that necessitates a comment; type: string}; pullNumber:{ description: Pull request number; type: number}; side:{ description: The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state; enum:[ LEFT; RIGHT]; type: string}; startLine:{ description: For multi-line comments, the first line of the range that the comment applies to; type: number}; startSide:{ description: For multi-line comments, the starting side of the diff that the comment applies to. LEFT indicates the previous state, RIGHT indicates the new state; enum:[ LEFT; RIGHT]; type: string}; subjectType:{ description: The level at which the comment is targeted; enum:[ FILE; LINE]; type: string}};[ owner; repo; pullNumber; path; body; subjectType]; object}}; add_pull_request_review_comment_to_pending_review; Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure).↵
{{ {{ Repository owner; string};{ Repository name; string}; issueNumber:{ description: Issue number; type: number}};[ owner; repo; issueNumber]; object}}; assign_copilot_to_issue; Assign Copilot to a specific issue in a GitHub repository.↵↵
This tool can help with the following outcomes:↵
- a Pull Request created with source code changes to resolve the issue↵↵↵
More information can be found at:↵
- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot↵↵
{{ {{ Repository owner; string};{ Repository name; string}; body:{ description: Review comment text; type: string}; commitID:{ description: SHA of commit to review; type: string}; event:{ description: Review action to perform; enum:[ APPROVE; REQUEST_CHANGES; COMMENT]; type: string}; pullNumber:{ description: Pull request number; type: number}};[ owner; repo; pullNumber; body; event]; object}}; create_and_submit_pull_request_review; Create and submit a review for a pull request without review comments.↵
{{ {{ Repository owner; string};{ Repository name; string}; branch:{ description: Name for new branch; type: string}; from_branch:{ description: Source branch (defaults to repo default); type: string}};[ owner; repo; branch]; object}}; create_branch; Create a new branch in a GitHub repository
{{ {{ Repository owner; string};{ Repository name; string}; assignees:{ description: Usernames to assign to this issue; items:{ type: string}; type: array}; body:{ description: Issue body content; type: string}; labels:{ description: Labels to apply to this issue; items:{ type: string}; type: array}; milestone:{ description: Milestone number; type: number}; title:{ description: Issue title; type: string}};[ owner; repo; title]; object}}; create_issue; Create a new issue in a GitHub repository.↵
{{ {{ Repository owner (username or organization); string};{ Repository name; string}; branch:{ description: Branch to create/update the file in; type: string}; content:{ description: Content of the file; type: string}; message:{ description: Commit message; type: string}; path:{ description: Path where to create/update the file; type: string}; sha:{ description: SHA of file being replaced (for updates); type: string}};[ owner; repo; path; content; message; branch]; object}}; create_or_update_file; Create or update a single file in a GitHub repository. If updating, you must provide the SHA of the file you want to update.↵
{{ {{ Repository owner; string};{ Repository name; string}; commitID:{ description: SHA of commit to review; type: string}; pullNumber:{ description: Pull request number; type: number}};[ owner; repo; pullNumber]; object}}; create_pending_pull_request_review; Create a pending review for a pull request. Call this first before attempting to add comments to a pending review, and ultimately submitting it. A pending pull request review means a pull request review, it is pending because you create it first and submit it later, and the PR author will not see it until it is submitted.↵
{{ {{ Repository owner; string};{ Repository name; string}; base:{ description: Branch to merge into; type: string}; body:{ description: PR description; type: string}; draft:{ description: Create as draft PR; type: boolean}; head:{ description: Branch containing changes; type: string}; maintainer_can_modify:{ description: Allow maintainer edits; type: boolean}; title:{ description: PR title; type: string}};[ owner; repo; title; head; base]; object}}; create_pull_request; Create a new pull request in a GitHub repository.↵
{{ {;; autoInit:{ description: Initialize with README; type: boolean}; description:{ description: Repository description; type: string}; name:{ description: Repository name; type: string}; private:{ description: Whether repo should be private; type: boolean}};[ name]; object}}; create_repository; Create a new GitHub repository in your account
{{ {{ Repository owner (username or organization); string};{ Repository name; string}; branch:{ description: Branch to delete the file from; type: string}; message:{ description: Commit message; type: string}; path:{ description: Path to the file to delete; type: string}};[ owner; repo; path; message; branch]; object}}; delete_file; Delete a file from a GitHub repository
{{ {{ Repository owner; string};{ Repository name; string}; pullNumber:{ description: Pull request number; type: number}};[ owner; repo; pullNumber]; object}}; delete_pending_pull_request_review; Delete the requester's latest pending pull request review. Use this after the user decides not to submit a pending review, if you don't know if they already created one then check first.↵
{{ {;; state:{ description: The new state of the notification (read/done); enum:[ read; done]; type: string}; threadID:{ description: The ID of the notification thread; type: string}};[ threadID]; object}}; dismiss_notification; Dismiss a notification by marking it as read or done
{{ {{ Repository owner; string};{ Repository name; string}; organization:{ description: Organization to fork to; type: string}};[ owner; repo]; object}}; fork_repository; Fork a GitHub repository to your account or specified organization
{{ {{ The owner of the repository.; string};{ The name of the repository.; string}; alertNumber:{ description: The number of the alert.; type: number}};[ owner; repo; alertNumber]; object}}; get_code_scanning_alert; Get details of a specific code scanning alert in a GitHub repository.↵
{{ {{ Repository owner; string};{ Repository name; string}; page:{ description: Page number for pagination (min·1); minimum:·1; type: number}; perPage:{ description: Results per page for pagination (min·1, max·100); maximum:·100; minimum:·1; type: number}; sha:{ description: Commit SHA, branch name, or tag name; type: string}};[ owner; repo; sha]; object}}; get_commit; Get details for a commit from a GitHub repository
... (truncated)
minemizer (compact)
chars: 21,912 tokens: 5,216 chars_og/tok: 9.9 enc_chars/tok: 4.2
<|begin▁of▁sentence|>inputSchema{json{properties{owner{description;type};repo{description;type};...};required[];type}};name;description
{{{{Repository owner;string};{Repository name;string};body:{description:Comment content;type:string};issue_number:{description:Issue number to comment on;type:number}};[owner;repo;issue_number;body];object}};add_issue_comment;Add a comment to a specific issue in a GitHub repository.↵
{{{{Repository owner;string};{Repository name;string};body:{description:The text of the review comment;type:string};line:{description:The line of the blob in the pull request diff that the comment applies to. For multi-line comments, the last line of the range;type:number};path:{description:The relative path to the file that necessitates a comment;type:string};pullNumber:{description:Pull request number;type:number};side:{description:The side of the diff to comment on. LEFT indicates the previous state, RIGHT indicates the new state;enum:[LEFT;RIGHT];type:string};startLine:{description:For multi-line comments, the first line of the range that the comment applies to;type:number};startSide:{description:For multi-line comments, the starting side of the diff that the comment applies to. LEFT indicates the previous state, RIGHT indicates the new state;enum:[LEFT;RIGHT];type:string};subjectType:{description:The level at which the comment is targeted;enum:[FILE;LINE];type:string}};[owner;repo;pullNumber;path;body;subjectType];object}};add_pull_request_review_comment_to_pending_review;Add a comment to the requester's latest pending pull request review, a pending review needs to already exist to call this (check with the user if not sure).↵
{{{{Repository owner;string};{Repository name;string};issueNumber:{description:Issue number;type:number}};[owner;repo;issueNumber];object}};assign_copilot_to_issue;Assign Copilot to a specific issue in a GitHub repository.↵↵
This tool can help with the following outcomes:↵
- a Pull Request created with source code changes to resolve the issue↵↵↵
More information can be found at:↵
- https://docs.github.com/en/copilot/using-github-copilot/using-copilot-coding-agent-to-work-on-tasks/about-assigning-tasks-to-copilot↵↵
{{{{Repository owner;string};{Repository name;string};body:{description:Review comment text;type:string};commitID:{description:SHA of commit to review;type:string};event:{description:Review action to perform;enum:[APPROVE;REQUEST_CHANGES;COMMENT];type:string};pullNumber:{description:Pull request number;type:number}};[owner;repo;pullNumber;body;event];object}};create_and_submit_pull_request_review;Create and submit a review for a pull request without review comments.↵
{{{{Repository owner;string};{Repository name;string};branch:{description:Name for new branch;type:string};from_branch:{description:Source branch (defaults to repo default);type:string}};[owner;repo;branch];object}};create_branch;Create a new branch in a GitHub repository
{{{{Repository owner;string};{Repository name;string};assignees:{description:Usernames to assign to this issue;items:{type:string};type:array};body:{description:Issue body content;type:string};labels:{description:Labels to apply to this issue;items:{type:string};type:array};milestone:{description:Milestone number;type:number};title:{description:Issue title;type:string}};[owner;repo;title];object}};create_issue;Create a new issue in a GitHub repository.↵
{{{{Repository owner (username or organization);string};{Repository name;string};branch:{description:Branch to create/update the file in;type:string};content:{description:Content of the file;type:string};message:{description:Commit message;type:string};path:{description:Path where to create/update the file;type:string};sha:{description:SHA of file being replaced (for updates);type:string}};[owner;repo;path;content;message;branch];object}};create_or_update_file;Create or update a single file in a GitHub repository. If updating, you must provide the SHA of the file you want to update.↵
{{{{Repository owner;string};{Repository name;string};commitID:{description:SHA of commit to review;type:string};pullNumber:{description:Pull request number;type:number}};[owner;repo;pullNumber];object}};create_pending_pull_request_review;Create a pending review for a pull request. Call this first before attempting to add comments to a pending review, and ultimately submitting it. A pending pull request review means a pull request review, it is pending because you create it first and submit it later, and the PR author will not see it until it is submitted.↵
{{{{Repository owner;string};{Repository name;string};base:{description:Branch to merge into;type:string};body:{description:PR description;type:string};draft:{description:Create as draft PR;type:boolean};head:{description:Branch containing changes;type:string};maintainer_can_modify:{description:Allow maintainer edits;type:boolean};title:{description:PR title;type:string}};[owner;repo;title;head;base];object}};create_pull_request;Create a new pull request in a GitHub repository.↵
{{{;;autoInit:{description:Initialize with README;type:boolean};description:{description:Repository description;type:string};name:{description:Repository name;type:string};private:{description:Whether repo should be private;type:boolean}};[name];object}};create_repository;Create a new GitHub repository in your account
{{{{Repository owner (username or organization);string};{Repository name;string};branch:{description:Branch to delete the file from;type:string};message:{description:Commit message;type:string};path:{description:Path to the file to delete;type:string}};[owner;repo;path;message;branch];object}};delete_file;Delete a file from a GitHub repository
{{{{Repository owner;string};{Repository name;string};pullNumber:{description:Pull request number;type:number}};[owner;repo;pullNumber];object}};delete_pending_pull_request_review;Delete the requester's latest pending pull request review. Use this after the user decides not to submit a pending review, if you don't know if they already created one then check first.↵
{{{;;state:{description:The new state of the notification (read/done);enum:[read;done];type:string};threadID:{description:The ID of the notification thread;type:string}};[threadID];object}};dismiss_notification;Dismiss a notification by marking it as read or done
{{{{Repository owner;string};{Repository name;string};organization:{description:Organization to fork to;type:string}};[owner;repo];object}};fork_repository;Fork a GitHub repository to your account or specified organization
{{{{The owner of the repository.;string};{The name of the repository.;string};alertNumber:{description:The number of the alert.;type:number}};[owner;repo;alertNumber];object}};get_code_scanning_alert;Get details of a specific code scanning alert in a GitHub repository.↵
{{{{Repository owner;string};{Repository name;string};page:{description:Page number for pagination (min·1);minimum:1;type:number};perPage:{description:Results per page for pagination (min·1, max·100);maximum:100;minimum:1;type:number};sha:{description:Commit SHA, branch name, or tag name;type:string}};[owner;repo;sha];object}};get_commit;Get details for a commit from a GitHub repository
... (truncated)